[
{
"page_no": 0,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.93,
"r_x1": 498.93,
"r_y1": 119.93,
"r_x2": 498.93,
"r_y2": 107.03,
"r_x3": 96.3,
"r_y3": 107.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.48,
"r_y0": 157.37,
"r_x1": 452.75,
"r_y1": 157.37,
"r_x2": 452.75,
"r_y2": 146.69,
"r_x3": 142.48,
"r_y3": 146.69,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.92,
"r_y0": 171.32,
"r_x1": 332.31,
"r_y1": 171.32,
"r_x2": 332.31,
"r_y2": 160.63,
"r_x3": 262.92,
"r_y3": 160.63,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 226.23,
"r_x1": 190.48,
"r_y1": 226.23,
"r_x2": 190.48,
"r_y2": 215.48,
"r_x3": 145.99,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 249.98,
"r_x1": 286.36,
"r_y1": 249.98,
"r_x2": 286.36,
"r_y2": 241.4,
"r_x3": 62.07,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 261.94,
"r_x1": 286.37,
"r_y1": 261.94,
"r_x2": 286.37,
"r_y2": 253.35,
"r_x3": 50.11,
"r_y3": 253.35,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 273.89,
"r_x1": 286.37,
"r_y1": 273.89,
"r_x2": 286.37,
"r_y2": 265.31,
"r_x3": 50.11,
"r_y3": 265.31,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 285.85,
"r_x1": 286.37,
"r_y1": 285.85,
"r_x2": 286.37,
"r_y2": 277.26,
"r_x3": 50.11,
"r_y3": 277.26,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 297.8,
"r_x1": 286.37,
"r_y1": 297.8,
"r_x2": 286.37,
"r_y2": 289.22,
"r_x3": 50.11,
"r_y3": 289.22,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 309.76,
"r_x1": 286.37,
"r_y1": 309.76,
"r_x2": 286.37,
"r_y2": 301.17,
"r_x3": 50.11,
"r_y3": 301.17,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 321.71,
"r_x1": 286.37,
"r_y1": 321.71,
"r_x2": 286.37,
"r_y2": 313.13,
"r_x3": 50.11,
"r_y3": 313.13,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 333.67,
"r_x1": 286.37,
"r_y1": 333.67,
"r_x2": 286.37,
"r_y2": 325.08,
"r_x3": 50.11,
"r_y3": 325.08,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 345.62,
"r_x1": 286.37,
"r_y1": 345.62,
"r_x2": 286.37,
"r_y2": 337.04,
"r_x3": 50.11,
"r_y3": 337.04,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 357.58,
"r_x1": 286.37,
"r_y1": 357.58,
"r_x2": 286.37,
"r_y2": 348.99,
"r_x3": 50.11,
"r_y3": 348.99,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 369.53,
"r_x1": 286.37,
"r_y1": 369.53,
"r_x2": 286.37,
"r_y2": 360.95,
"r_x3": 50.11,
"r_y3": 360.95,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 381.49,
"r_x1": 286.37,
"r_y1": 381.49,
"r_x2": 286.37,
"r_y2": 372.9,
"r_x3": 50.11,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 393.44,
"r_x1": 286.37,
"r_y1": 393.44,
"r_x2": 286.37,
"r_y2": 384.86,
"r_x3": 50.11,
"r_y3": 384.86,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 405.4,
"r_x1": 286.37,
"r_y1": 405.4,
"r_x2": 286.37,
"r_y2": 396.81,
"r_x3": 50.11,
"r_y3": 396.81,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 417.35,
"r_x1": 286.37,
"r_y1": 417.35,
"r_x2": 286.37,
"r_y2": 408.77,
"r_x3": 50.11,
"r_y3": 408.77,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 429.31,
"r_x1": 286.37,
"r_y1": 429.31,
"r_x2": 286.37,
"r_y2": 420.72,
"r_x3": 50.11,
"r_y3": 420.72,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 441.27,
"r_x1": 207.23,
"r_y1": 441.27,
"r_x2": 207.23,
"r_y2": 432.68,
"r_x3": 50.11,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.27,
"r_x1": 286.37,
"r_y1": 441.27,
"r_x2": 286.37,
"r_y2": 432.68,
"r_x3": 214.1,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 453.22,
"r_x1": 286.37,
"r_y1": 453.22,
"r_x2": 286.37,
"r_y2": 444.63,
"r_x3": 50.11,
"r_y3": 444.63,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 465.18,
"r_x1": 286.37,
"r_y1": 465.18,
"r_x2": 286.37,
"r_y2": 456.59,
"r_x3": 50.11,
"r_y3": 456.59,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 477.13,
"r_x1": 286.37,
"r_y1": 477.13,
"r_x2": 286.37,
"r_y2": 468.54,
"r_x3": 50.11,
"r_y3": 468.54,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 489.09,
"r_x1": 286.37,
"r_y1": 489.09,
"r_x2": 286.37,
"r_y2": 480.5,
"r_x3": 50.11,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.04,
"r_x1": 286.37,
"r_y1": 501.04,
"r_x2": 286.37,
"r_y2": 492.45,
"r_x3": 50.11,
"r_y3": 492.45,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 513.0,
"r_x1": 276.65,
"r_y1": 513.0,
"r_x2": 276.65,
"r_y2": 504.41,
"r_x3": 50.11,
"r_y3": 504.41,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.69,
"r_x1": 58.12,
"r_y1": 550.69,
"r_x2": 58.12,
"r_y2": 539.94,
"r_x3": 50.11,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.69,
"r_x1": 126.95,
"r_y1": 550.69,
"r_x2": 126.95,
"r_y2": 539.94,
"r_x3": 68.8,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 569.69,
"r_x1": 286.36,
"r_y1": 569.69,
"r_x2": 286.36,
"r_y2": 560.78,
"r_x3": 62.07,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 76.4,
"r_y1": 713.15,
"r_x2": 76.4,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 226.75,
"r_x1": 324.01,
"r_y1": 226.75,
"r_x2": 324.01,
"r_y2": 218.01,
"r_x3": 315.57,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.23,
"r_y0": 226.75,
"r_x1": 408.44,
"r_y1": 226.75,
"r_x2": 408.44,
"r_y2": 218.01,
"r_x3": 328.23,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 322.44,
"r_x1": 325.06,
"r_y1": 322.44,
"r_x2": 325.06,
"r_y2": 313.69,
"r_x3": 315.57,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.44,
"r_x1": 486.4,
"r_y1": 322.44,
"r_x2": 486.4,
"r_y2": 313.69,
"r_x3": 329.8,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.46,
"r_y0": 333.24,
"r_x1": 472.47,
"r_y1": 333.24,
"r_x2": 472.47,
"r_y2": 324.49,
"r_x3": 326.46,
"r_y3": 324.49,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 428.93,
"r_x1": 324.81,
"r_y1": 428.93,
"r_x2": 324.81,
"r_y2": 420.18,
"r_x3": 315.57,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.43,
"r_y0": 428.93,
"r_x1": 491.19,
"r_y1": 428.93,
"r_x2": 491.19,
"r_y2": 420.18,
"r_x3": 329.43,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 523.41,
"r_x1": 345.73,
"r_y1": 523.41,
"r_x2": 345.73,
"r_y2": 514.5,
"r_x3": 308.86,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.18,
"r_y0": 523.41,
"r_x1": 545.12,
"r_y1": 523.41,
"r_x2": 545.12,
"r_y2": 514.5,
"r_x3": 353.18,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 535.36,
"r_x1": 545.12,
"r_y1": 535.36,
"r_x2": 545.12,
"r_y2": 526.46,
"r_x3": 308.86,
"r_y3": 526.46,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 547.32,
"r_x1": 545.12,
"r_y1": 547.32,
"r_x2": 545.12,
"r_y2": 538.41,
"r_x3": 308.86,
"r_y3": 538.41,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 559.27,
"r_x1": 505.69,
"r_y1": 559.27,
"r_x2": 505.69,
"r_y2": 550.37,
"r_x3": 308.86,
"r_y3": 550.37,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 593.32,
"r_x1": 545.11,
"r_y1": 593.32,
"r_x2": 545.11,
"r_y2": 584.41,
"r_x3": 320.82,
"r_y3": 584.41,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.27,
"r_x1": 545.12,
"r_y1": 605.27,
"r_x2": 545.12,
"r_y2": 596.36,
"r_x3": 308.86,
"r_y3": 596.36,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.23,
"r_x1": 545.12,
"r_y1": 617.23,
"r_x2": 545.12,
"r_y2": 608.32,
"r_x3": 308.86,
"r_y3": 608.32,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.18,
"r_x1": 545.12,
"r_y1": 629.18,
"r_x2": 545.12,
"r_y2": 620.27,
"r_x3": 308.86,
"r_y3": 620.27,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.14,
"r_x1": 353.69,
"r_y1": 641.14,
"r_x2": 353.69,
"r_y2": 632.23,
"r_x3": 308.86,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.11,
"r_y0": 641.14,
"r_x1": 374.67,
"r_y1": 641.14,
"r_x2": 374.67,
"r_y2": 632.23,
"r_x3": 362.11,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.36,
"r_y0": 641.14,
"r_x1": 545.12,
"r_y1": 641.14,
"r_x2": 545.12,
"r_y2": 632.23,
"r_x3": 377.36,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.09,
"r_x1": 545.12,
"r_y1": 653.09,
"r_x2": 545.12,
"r_y2": 644.19,
"r_x3": 308.86,
"r_y3": 644.19,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.05,
"r_x1": 375.55,
"r_y1": 665.05,
"r_x2": 375.55,
"r_y2": 656.14,
"r_x3": 308.86,
"r_y3": 656.14,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 320.82,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.11,
"r_y1": 713.15,
"r_x2": 545.11,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.34,
"r_y0": 560.0,
"r_x1": 36.34,
"r_y1": 560.0,
"r_x2": 36.34,
"r_y2": 207.82,
"r_x3": 18.34,
"r_y3": 207.82,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.03,
"r": 498.93,
"b": 119.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.93,
"r_x1": 498.93,
"r_y1": 119.93,
"r_x2": 498.93,
"r_y2": 107.03,
"r_x3": 96.3,
"r_y3": 107.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.48,
"t": 146.69,
"r": 452.75,
"b": 171.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.48,
"r_y0": 157.37,
"r_x1": 452.75,
"r_y1": 157.37,
"r_x2": 452.75,
"r_y2": 146.69,
"r_x3": 142.48,
"r_y3": 146.69,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.92,
"r_y0": 171.32,
"r_x1": 332.31,
"r_y1": 171.32,
"r_x2": 332.31,
"r_y2": 160.63,
"r_x3": 262.92,
"r_y3": 160.63,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.485,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 5,
"label": "section_header",
"bbox": {
"l": 145.99,
"t": 215.48,
"r": 190.48,
"b": 226.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 226.23,
"r_x1": 190.48,
"r_y1": 226.23,
"r_x2": 190.48,
"r_y2": 215.48,
"r_x3": 145.99,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 241.4,
"r": 286.37,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 249.98,
"r_x1": 286.36,
"r_y1": 249.98,
"r_x2": 286.36,
"r_y2": 241.4,
"r_x3": 62.07,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 261.94,
"r_x1": 286.37,
"r_y1": 261.94,
"r_x2": 286.37,
"r_y2": 253.35,
"r_x3": 50.11,
"r_y3": 253.35,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 273.89,
"r_x1": 286.37,
"r_y1": 273.89,
"r_x2": 286.37,
"r_y2": 265.31,
"r_x3": 50.11,
"r_y3": 265.31,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 285.85,
"r_x1": 286.37,
"r_y1": 285.85,
"r_x2": 286.37,
"r_y2": 277.26,
"r_x3": 50.11,
"r_y3": 277.26,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 297.8,
"r_x1": 286.37,
"r_y1": 297.8,
"r_x2": 286.37,
"r_y2": 289.22,
"r_x3": 50.11,
"r_y3": 289.22,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 309.76,
"r_x1": 286.37,
"r_y1": 309.76,
"r_x2": 286.37,
"r_y2": 301.17,
"r_x3": 50.11,
"r_y3": 301.17,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 321.71,
"r_x1": 286.37,
"r_y1": 321.71,
"r_x2": 286.37,
"r_y2": 313.13,
"r_x3": 50.11,
"r_y3": 313.13,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 333.67,
"r_x1": 286.37,
"r_y1": 333.67,
"r_x2": 286.37,
"r_y2": 325.08,
"r_x3": 50.11,
"r_y3": 325.08,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 345.62,
"r_x1": 286.37,
"r_y1": 345.62,
"r_x2": 286.37,
"r_y2": 337.04,
"r_x3": 50.11,
"r_y3": 337.04,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 357.58,
"r_x1": 286.37,
"r_y1": 357.58,
"r_x2": 286.37,
"r_y2": 348.99,
"r_x3": 50.11,
"r_y3": 348.99,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 369.53,
"r_x1": 286.37,
"r_y1": 369.53,
"r_x2": 286.37,
"r_y2": 360.95,
"r_x3": 50.11,
"r_y3": 360.95,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 381.49,
"r_x1": 286.37,
"r_y1": 381.49,
"r_x2": 286.37,
"r_y2": 372.9,
"r_x3": 50.11,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 393.44,
"r_x1": 286.37,
"r_y1": 393.44,
"r_x2": 286.37,
"r_y2": 384.86,
"r_x3": 50.11,
"r_y3": 384.86,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 405.4,
"r_x1": 286.37,
"r_y1": 405.4,
"r_x2": 286.37,
"r_y2": 396.81,
"r_x3": 50.11,
"r_y3": 396.81,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 417.35,
"r_x1": 286.37,
"r_y1": 417.35,
"r_x2": 286.37,
"r_y2": 408.77,
"r_x3": 50.11,
"r_y3": 408.77,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 429.31,
"r_x1": 286.37,
"r_y1": 429.31,
"r_x2": 286.37,
"r_y2": 420.72,
"r_x3": 50.11,
"r_y3": 420.72,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 441.27,
"r_x1": 207.23,
"r_y1": 441.27,
"r_x2": 207.23,
"r_y2": 432.68,
"r_x3": 50.11,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.27,
"r_x1": 286.37,
"r_y1": 441.27,
"r_x2": 286.37,
"r_y2": 432.68,
"r_x3": 214.1,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 453.22,
"r_x1": 286.37,
"r_y1": 453.22,
"r_x2": 286.37,
"r_y2": 444.63,
"r_x3": 50.11,
"r_y3": 444.63,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 465.18,
"r_x1": 286.37,
"r_y1": 465.18,
"r_x2": 286.37,
"r_y2": 456.59,
"r_x3": 50.11,
"r_y3": 456.59,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 477.13,
"r_x1": 286.37,
"r_y1": 477.13,
"r_x2": 286.37,
"r_y2": 468.54,
"r_x3": 50.11,
"r_y3": 468.54,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 489.09,
"r_x1": 286.37,
"r_y1": 489.09,
"r_x2": 286.37,
"r_y2": 480.5,
"r_x3": 50.11,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.04,
"r_x1": 286.37,
"r_y1": 501.04,
"r_x2": 286.37,
"r_y2": 492.45,
"r_x3": 50.11,
"r_y3": 492.45,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 513.0,
"r_x1": 276.65,
"r_y1": 513.0,
"r_x2": 276.65,
"r_y2": 504.41,
"r_x3": 50.11,
"r_y3": 504.41,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 539.94,
"r": 126.95,
"b": 550.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.932,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.69,
"r_x1": 58.12,
"r_y1": 550.69,
"r_x2": 58.12,
"r_y2": 539.94,
"r_x3": 50.11,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.69,
"r_x1": 126.95,
"r_y1": 550.69,
"r_x2": 126.95,
"r_y2": 539.94,
"r_x3": 68.8,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 560.78,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 569.69,
"r_x1": 286.36,
"r_y1": 569.69,
"r_x2": 286.36,
"r_y2": 560.78,
"r_x3": 62.07,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 76.4,
"r_y1": 713.15,
"r_x2": 76.4,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.57,
"t": 218.01,
"r": 408.44,
"b": 226.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.672,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 226.75,
"r_x1": 324.01,
"r_y1": 226.75,
"r_x2": 324.01,
"r_y2": 218.01,
"r_x3": 315.57,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.23,
"r_y0": 226.75,
"r_x1": 408.44,
"r_y1": 226.75,
"r_x2": 408.44,
"r_y2": 218.01,
"r_x3": 328.23,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 313.69,
"r": 486.4,
"b": 333.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.555,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 322.44,
"r_x1": 325.06,
"r_y1": 322.44,
"r_x2": 325.06,
"r_y2": 313.69,
"r_x3": 315.57,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.44,
"r_x1": 486.4,
"r_y1": 322.44,
"r_x2": 486.4,
"r_y2": 313.69,
"r_x3": 329.8,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.46,
"r_y0": 333.24,
"r_x1": 472.47,
"r_y1": 333.24,
"r_x2": 472.47,
"r_y2": 324.49,
"r_x3": 326.46,
"r_y3": 324.49,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 420.18,
"r": 491.19,
"b": 428.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 428.93,
"r_x1": 324.81,
"r_y1": 428.93,
"r_x2": 324.81,
"r_y2": 420.18,
"r_x3": 315.57,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.43,
"r_y0": 428.93,
"r_x1": 491.19,
"r_y1": 428.93,
"r_x2": 491.19,
"r_y2": 420.18,
"r_x3": 329.43,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "picture",
"bbox": {
"l": 314.78,
"t": 338.07,
"r": 539.18,
"b": 410.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.874,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.15,
"t": 342.83,
"r": 412.54,
"b": 351.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.11,
"t": 341.57,
"r": 360.5,
"b": 350.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.68,
"t": 340.94,
"r": 505.07,
"b": 349.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.13,
"t": 351.75,
"r": 360.53,
"b": 360.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.54,
"t": 355.88,
"r": 406.93,
"b": 364.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.58,
"t": 352.84,
"r": 452.97,
"b": 361.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.65,
"t": 353.71,
"r": 496.04,
"b": 362.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.14,
"t": 353.34,
"r": 539.53,
"b": 362.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.83,
"t": 387.1,
"r": 353.22,
"b": 395.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.27,
"t": 375.37,
"r": 393.66,
"b": 384.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.67,
"t": 375.65,
"r": 451.46,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.44,
"t": 375.53,
"r": 485.9,
"b": 384.32,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.57,
"t": 375.65,
"r": 531.36,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.23,
"t": 387.11,
"r": 409.01,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.31,
"t": 386.99,
"r": 451.09,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.22,
"t": 387.37,
"r": 487.0,
"b": 396.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.23,
"t": 386.99,
"r": 532.01,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.57,
"t": 399.42,
"r": 415.96,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 415.96,
"t": 399.42,
"r": 420.36,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.31,
"t": 399.04,
"r": 451.09,
"b": 407.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.78,
"t": 399.0,
"r": 487.56,
"b": 407.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 523.97,
"t": 398.61,
"r": 532.76,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.09,
"t": 357.76,
"r": 391.1,
"b": 367.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.43,
"t": 380.73,
"r": 339.44,
"b": 390.86,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.07,
"t": 341.04,
"r": 484.08,
"b": 351.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 23,
"label": "picture",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.509,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "table",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 16,
"label": "picture",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.609,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 15,
"label": "table",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.652,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 6,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 514.5,
"r": 545.12,
"b": 559.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.921,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 523.41,
"r_x1": 345.73,
"r_y1": 523.41,
"r_x2": 345.73,
"r_y2": 514.5,
"r_x3": 308.86,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.18,
"r_y0": 523.41,
"r_x1": 545.12,
"r_y1": 523.41,
"r_x2": 545.12,
"r_y2": 514.5,
"r_x3": 353.18,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 535.36,
"r_x1": 545.12,
"r_y1": 535.36,
"r_x2": 545.12,
"r_y2": 526.46,
"r_x3": 308.86,
"r_y3": 526.46,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 547.32,
"r_x1": 545.12,
"r_y1": 547.32,
"r_x2": 545.12,
"r_y2": 538.41,
"r_x3": 308.86,
"r_y3": 538.41,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 559.27,
"r_x1": 505.69,
"r_y1": 559.27,
"r_x2": 505.69,
"r_y2": 550.37,
"r_x3": 308.86,
"r_y3": 550.37,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 584.41,
"r": 545.12,
"b": 665.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 593.32,
"r_x1": 545.11,
"r_y1": 593.32,
"r_x2": 545.11,
"r_y2": 584.41,
"r_x3": 320.82,
"r_y3": 584.41,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.27,
"r_x1": 545.12,
"r_y1": 605.27,
"r_x2": 545.12,
"r_y2": 596.36,
"r_x3": 308.86,
"r_y3": 596.36,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.23,
"r_x1": 545.12,
"r_y1": 617.23,
"r_x2": 545.12,
"r_y2": 608.32,
"r_x3": 308.86,
"r_y3": 608.32,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.18,
"r_x1": 545.12,
"r_y1": 629.18,
"r_x2": 545.12,
"r_y2": 620.27,
"r_x3": 308.86,
"r_y3": 620.27,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.14,
"r_x1": 353.69,
"r_y1": 641.14,
"r_x2": 353.69,
"r_y2": 632.23,
"r_x3": 308.86,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.11,
"r_y0": 641.14,
"r_x1": 374.67,
"r_y1": 641.14,
"r_x2": 374.67,
"r_y2": 632.23,
"r_x3": 362.11,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.36,
"r_y0": 641.14,
"r_x1": 545.12,
"r_y1": 641.14,
"r_x2": 545.12,
"r_y2": 632.23,
"r_x3": 377.36,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.09,
"r_x1": 545.12,
"r_y1": 653.09,
"r_x2": 545.12,
"r_y2": 644.19,
"r_x3": 308.86,
"r_y3": 644.19,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.05,
"r_x1": 375.55,
"r_y1": 665.05,
"r_x2": 375.55,
"r_y2": 656.14,
"r_x3": 308.86,
"r_y3": 656.14,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.38,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 320.82,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.11,
"r_y1": 713.15,
"r_x2": 545.11,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.805,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.34,
"t": 207.82,
"r": 36.34,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.34,
"r_y0": 560.0,
"r_x1": 36.34,
"r_y1": 560.0,
"r_x2": 36.34,
"r_y2": 207.82,
"r_x3": 18.34,
"r_y3": 207.82,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"11": {
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"15": {
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.652,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 8,
"page_no": 0,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.03,
"r": 498.93,
"b": 119.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.93,
"r_x1": 498.93,
"r_y1": 119.93,
"r_x2": 498.93,
"r_y2": 107.03,
"r_x3": 96.3,
"r_y3": 107.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers."
},
{
"label": "section_header",
"id": 13,
"page_no": 0,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.48,
"t": 146.69,
"r": 452.75,
"b": 171.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.48,
"r_y0": 157.37,
"r_x1": 452.75,
"r_y1": 157.37,
"r_x2": 452.75,
"r_y2": 146.69,
"r_x3": 142.48,
"r_y3": 146.69,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.92,
"r_y0": 171.32,
"r_x1": 332.31,
"r_y1": 171.32,
"r_x2": 332.31,
"r_y2": 160.63,
"r_x3": 262.92,
"r_y3": 160.63,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"
},
{
"label": "key_value_region",
"id": 25,
"page_no": 0,
"cluster": {
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.485,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null
},
{
"label": "section_header",
"id": 5,
"page_no": 0,
"cluster": {
"id": 5,
"label": "section_header",
"bbox": {
"l": 145.99,
"t": 215.48,
"r": 190.48,
"b": 226.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 226.23,
"r_x1": 190.48,
"r_y1": 226.23,
"r_x2": 190.48,
"r_y2": 215.48,
"r_x3": 145.99,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Abstract"
},
{
"label": "text",
"id": 2,
"page_no": 0,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 241.4,
"r": 286.37,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 249.98,
"r_x1": 286.36,
"r_y1": 249.98,
"r_x2": 286.36,
"r_y2": 241.4,
"r_x3": 62.07,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 261.94,
"r_x1": 286.37,
"r_y1": 261.94,
"r_x2": 286.37,
"r_y2": 253.35,
"r_x3": 50.11,
"r_y3": 253.35,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 273.89,
"r_x1": 286.37,
"r_y1": 273.89,
"r_x2": 286.37,
"r_y2": 265.31,
"r_x3": 50.11,
"r_y3": 265.31,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 285.85,
"r_x1": 286.37,
"r_y1": 285.85,
"r_x2": 286.37,
"r_y2": 277.26,
"r_x3": 50.11,
"r_y3": 277.26,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 297.8,
"r_x1": 286.37,
"r_y1": 297.8,
"r_x2": 286.37,
"r_y2": 289.22,
"r_x3": 50.11,
"r_y3": 289.22,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 309.76,
"r_x1": 286.37,
"r_y1": 309.76,
"r_x2": 286.37,
"r_y2": 301.17,
"r_x3": 50.11,
"r_y3": 301.17,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 321.71,
"r_x1": 286.37,
"r_y1": 321.71,
"r_x2": 286.37,
"r_y2": 313.13,
"r_x3": 50.11,
"r_y3": 313.13,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 333.67,
"r_x1": 286.37,
"r_y1": 333.67,
"r_x2": 286.37,
"r_y2": 325.08,
"r_x3": 50.11,
"r_y3": 325.08,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 345.62,
"r_x1": 286.37,
"r_y1": 345.62,
"r_x2": 286.37,
"r_y2": 337.04,
"r_x3": 50.11,
"r_y3": 337.04,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 357.58,
"r_x1": 286.37,
"r_y1": 357.58,
"r_x2": 286.37,
"r_y2": 348.99,
"r_x3": 50.11,
"r_y3": 348.99,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 369.53,
"r_x1": 286.37,
"r_y1": 369.53,
"r_x2": 286.37,
"r_y2": 360.95,
"r_x3": 50.11,
"r_y3": 360.95,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 381.49,
"r_x1": 286.37,
"r_y1": 381.49,
"r_x2": 286.37,
"r_y2": 372.9,
"r_x3": 50.11,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 393.44,
"r_x1": 286.37,
"r_y1": 393.44,
"r_x2": 286.37,
"r_y2": 384.86,
"r_x3": 50.11,
"r_y3": 384.86,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 405.4,
"r_x1": 286.37,
"r_y1": 405.4,
"r_x2": 286.37,
"r_y2": 396.81,
"r_x3": 50.11,
"r_y3": 396.81,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 417.35,
"r_x1": 286.37,
"r_y1": 417.35,
"r_x2": 286.37,
"r_y2": 408.77,
"r_x3": 50.11,
"r_y3": 408.77,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 429.31,
"r_x1": 286.37,
"r_y1": 429.31,
"r_x2": 286.37,
"r_y2": 420.72,
"r_x3": 50.11,
"r_y3": 420.72,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 441.27,
"r_x1": 207.23,
"r_y1": 441.27,
"r_x2": 207.23,
"r_y2": 432.68,
"r_x3": 50.11,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.27,
"r_x1": 286.37,
"r_y1": 441.27,
"r_x2": 286.37,
"r_y2": 432.68,
"r_x3": 214.1,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 453.22,
"r_x1": 286.37,
"r_y1": 453.22,
"r_x2": 286.37,
"r_y2": 444.63,
"r_x3": 50.11,
"r_y3": 444.63,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 465.18,
"r_x1": 286.37,
"r_y1": 465.18,
"r_x2": 286.37,
"r_y2": 456.59,
"r_x3": 50.11,
"r_y3": 456.59,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 477.13,
"r_x1": 286.37,
"r_y1": 477.13,
"r_x2": 286.37,
"r_y2": 468.54,
"r_x3": 50.11,
"r_y3": 468.54,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 489.09,
"r_x1": 286.37,
"r_y1": 489.09,
"r_x2": 286.37,
"r_y2": 480.5,
"r_x3": 50.11,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.04,
"r_x1": 286.37,
"r_y1": 501.04,
"r_x2": 286.37,
"r_y2": 492.45,
"r_x3": 50.11,
"r_y3": 492.45,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 513.0,
"r_x1": 276.65,
"r_y1": 513.0,
"r_x2": 276.65,
"r_y2": 504.41,
"r_x3": 50.11,
"r_y3": 504.41,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."
},
{
"label": "section_header",
"id": 4,
"page_no": 0,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 539.94,
"r": 126.95,
"b": 550.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.932,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.69,
"r_x1": 58.12,
"r_y1": 550.69,
"r_x2": 58.12,
"r_y2": 539.94,
"r_x3": 50.11,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.69,
"r_x1": 126.95,
"r_y1": 550.69,
"r_x2": 126.95,
"r_y2": 539.94,
"r_x3": 68.8,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Introduction"
},
{
"label": "text",
"id": 1,
"page_no": 0,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 560.78,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 569.69,
"r_x1": 286.36,
"r_y1": 569.69,
"r_x2": 286.36,
"r_y2": 560.78,
"r_x3": 62.07,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 76.4,
"r_y1": 713.15,
"r_x2": 76.4,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."
},
{
"label": "section_header",
"id": 14,
"page_no": 0,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.57,
"t": 218.01,
"r": 408.44,
"b": 226.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.672,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 226.75,
"r_x1": 324.01,
"r_y1": 226.75,
"r_x2": 324.01,
"r_y2": 218.01,
"r_x3": 315.57,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.23,
"r_y0": 226.75,
"r_x1": 408.44,
"r_y1": 226.75,
"r_x2": 408.44,
"r_y2": 218.01,
"r_x3": 328.23,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a. Picture of a table:"
},
{
"label": "list_item",
"id": 17,
"page_no": 0,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 313.69,
"r": 486.4,
"b": 333.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.555,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 322.44,
"r_x1": 325.06,
"r_y1": 322.44,
"r_x2": 325.06,
"r_y2": 313.69,
"r_x3": 315.57,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.44,
"r_x1": 486.4,
"r_y1": 322.44,
"r_x2": 486.4,
"r_y2": 313.69,
"r_x3": 329.8,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.46,
"r_y0": 333.24,
"r_x1": 472.47,
"r_y1": 333.24,
"r_x2": 472.47,
"r_y2": 324.49,
"r_x3": 326.46,
"r_y3": 324.49,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"
},
{
"label": "list_item",
"id": 18,
"page_no": 0,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 420.18,
"r": 491.19,
"b": 428.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 428.93,
"r_x1": 324.81,
"r_y1": 428.93,
"r_x2": 324.81,
"r_y2": 420.18,
"r_x3": 315.57,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.43,
"r_y0": 428.93,
"r_x1": 491.19,
"r_y1": 428.93,
"r_x2": 491.19,
"r_y2": 420.18,
"r_x3": 329.43,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "c. Structure predicted by TableFormer:"
},
{
"label": "picture",
"id": 10,
"page_no": 0,
"cluster": {
"id": 10,
"label": "picture",
"bbox": {
"l": 314.78,
"t": 338.07,
"r": 539.18,
"b": 410.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.874,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.15,
"t": 342.83,
"r": 412.54,
"b": 351.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.11,
"t": 341.57,
"r": 360.5,
"b": 350.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.68,
"t": 340.94,
"r": 505.07,
"b": 349.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.13,
"t": 351.75,
"r": 360.53,
"b": 360.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.54,
"t": 355.88,
"r": 406.93,
"b": 364.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.58,
"t": 352.84,
"r": 452.97,
"b": 361.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.65,
"t": 353.71,
"r": 496.04,
"b": 362.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.14,
"t": 353.34,
"r": 539.53,
"b": 362.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.83,
"t": 387.1,
"r": 353.22,
"b": 395.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.27,
"t": 375.37,
"r": 393.66,
"b": 384.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.67,
"t": 375.65,
"r": 451.46,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.44,
"t": 375.53,
"r": 485.9,
"b": 384.32,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.57,
"t": 375.65,
"r": 531.36,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.23,
"t": 387.11,
"r": 409.01,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.31,
"t": 386.99,
"r": 451.09,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.22,
"t": 387.37,
"r": 487.0,
"b": 396.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.23,
"t": 386.99,
"r": 532.01,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.57,
"t": 399.42,
"r": 415.96,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 415.96,
"t": 399.42,
"r": 420.36,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.31,
"t": 399.04,
"r": 451.09,
"b": 407.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.78,
"t": 399.0,
"r": 487.56,
"b": 407.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 523.97,
"t": 398.61,
"r": 532.76,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.09,
"t": 357.76,
"r": 391.1,
"b": 367.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.43,
"t": 380.73,
"r": 339.44,
"b": 390.86,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.07,
"t": 341.04,
"r": 484.08,
"b": 351.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 23,
"page_no": 0,
"cluster": {
"id": 23,
"label": "picture",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.509,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "picture",
"id": 16,
"page_no": 0,
"cluster": {
"id": 16,
"label": "picture",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.609,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.652,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 0,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 514.5,
"r": 545.12,
"b": 559.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.921,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 523.41,
"r_x1": 345.73,
"r_y1": 523.41,
"r_x2": 345.73,
"r_y2": 514.5,
"r_x3": 308.86,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.18,
"r_y0": 523.41,
"r_x1": 545.12,
"r_y1": 523.41,
"r_x2": 545.12,
"r_y2": 514.5,
"r_x3": 353.18,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 535.36,
"r_x1": 545.12,
"r_y1": 535.36,
"r_x2": 545.12,
"r_y2": 526.46,
"r_x3": 308.86,
"r_y3": 526.46,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 547.32,
"r_x1": 545.12,
"r_y1": 547.32,
"r_x2": 545.12,
"r_y2": 538.41,
"r_x3": 308.86,
"r_y3": 538.41,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 559.27,
"r_x1": 505.69,
"r_y1": 559.27,
"r_x2": 505.69,
"r_y2": 550.37,
"r_x3": 308.86,
"r_y3": 550.37,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."
},
{
"label": "text",
"id": 0,
"page_no": 0,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 584.41,
"r": 545.12,
"b": 665.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 593.32,
"r_x1": 545.11,
"r_y1": 593.32,
"r_x2": 545.11,
"r_y2": 584.41,
"r_x3": 320.82,
"r_y3": 584.41,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.27,
"r_x1": 545.12,
"r_y1": 605.27,
"r_x2": 545.12,
"r_y2": 596.36,
"r_x3": 308.86,
"r_y3": 596.36,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.23,
"r_x1": 545.12,
"r_y1": 617.23,
"r_x2": 545.12,
"r_y2": 608.32,
"r_x3": 308.86,
"r_y3": 608.32,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.18,
"r_x1": 545.12,
"r_y1": 629.18,
"r_x2": 545.12,
"r_y2": 620.27,
"r_x3": 308.86,
"r_y3": 620.27,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.14,
"r_x1": 353.69,
"r_y1": 641.14,
"r_x2": 353.69,
"r_y2": 632.23,
"r_x3": 308.86,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.11,
"r_y0": 641.14,
"r_x1": 374.67,
"r_y1": 641.14,
"r_x2": 374.67,
"r_y2": 632.23,
"r_x3": 362.11,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.36,
"r_y0": 641.14,
"r_x1": 545.12,
"r_y1": 641.14,
"r_x2": 545.12,
"r_y2": 632.23,
"r_x3": 377.36,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.09,
"r_x1": 545.12,
"r_y1": 653.09,
"r_x2": 545.12,
"r_y2": 644.19,
"r_x3": 308.86,
"r_y3": 644.19,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.05,
"r_x1": 375.55,
"r_y1": 665.05,
"r_x2": 375.55,
"r_y2": 656.14,
"r_x3": 308.86,
"r_y3": 656.14,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."
},
{
"label": "text",
"id": 3,
"page_no": 0,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.38,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 320.82,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.11,
"r_y1": 713.15,
"r_x2": 545.11,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"
},
{
"label": "page_footer",
"id": 12,
"page_no": 0,
"cluster": {
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.805,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1"
},
{
"label": "page_header",
"id": 9,
"page_no": 0,
"cluster": {
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.34,
"t": 207.82,
"r": 36.34,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.34,
"r_y0": 560.0,
"r_x1": 36.34,
"r_y1": 560.0,
"r_x2": 36.34,
"r_y2": 207.82,
"r_x3": 18.34,
"r_y3": 207.82,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"
}
],
"body": [
{
"label": "section_header",
"id": 8,
"page_no": 0,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.03,
"r": 498.93,
"b": 119.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.93,
"r_x1": 498.93,
"r_y1": 119.93,
"r_x2": 498.93,
"r_y2": 107.03,
"r_x3": 96.3,
"r_y3": 107.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers."
},
{
"label": "section_header",
"id": 13,
"page_no": 0,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.48,
"t": 146.69,
"r": 452.75,
"b": 171.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.48,
"r_y0": 157.37,
"r_x1": 452.75,
"r_y1": 157.37,
"r_x2": 452.75,
"r_y2": 146.69,
"r_x3": 142.48,
"r_y3": 146.69,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.92,
"r_y0": 171.32,
"r_x1": 332.31,
"r_y1": 171.32,
"r_x2": 332.31,
"r_y2": 160.63,
"r_x3": 262.92,
"r_y3": 160.63,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"
},
{
"label": "key_value_region",
"id": 25,
"page_no": 0,
"cluster": {
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.485,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.12,
"t": 175.96,
"r": 378.73,
"b": 184.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.12,
"r_y0": 184.43,
"r_x1": 212.73,
"r_y1": 184.43,
"r_x2": 212.73,
"r_y2": 175.96,
"r_x3": 208.12,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.73,
"r_y0": 184.0,
"r_x1": 293.43,
"r_y1": 184.0,
"r_x2": 293.43,
"r_y2": 177.08,
"r_x3": 212.73,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.43,
"r_y0": 184.43,
"r_x1": 298.04,
"r_y1": 184.43,
"r_x2": 298.04,
"r_y2": 175.96,
"r_x3": 293.43,
"r_y3": 175.96,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.03,
"r_y0": 184.0,
"r_x1": 378.73,
"r_y1": 184.0,
"r_x2": 378.73,
"r_y2": 177.08,
"r_x3": 298.03,
"r_y3": 177.08,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null
},
{
"label": "section_header",
"id": 5,
"page_no": 0,
"cluster": {
"id": 5,
"label": "section_header",
"bbox": {
"l": 145.99,
"t": 215.48,
"r": 190.48,
"b": 226.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 226.23,
"r_x1": 190.48,
"r_y1": 226.23,
"r_x2": 190.48,
"r_y2": 215.48,
"r_x3": 145.99,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Abstract"
},
{
"label": "text",
"id": 2,
"page_no": 0,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 241.4,
"r": 286.37,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 249.98,
"r_x1": 286.36,
"r_y1": 249.98,
"r_x2": 286.36,
"r_y2": 241.4,
"r_x3": 62.07,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 261.94,
"r_x1": 286.37,
"r_y1": 261.94,
"r_x2": 286.37,
"r_y2": 253.35,
"r_x3": 50.11,
"r_y3": 253.35,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 273.89,
"r_x1": 286.37,
"r_y1": 273.89,
"r_x2": 286.37,
"r_y2": 265.31,
"r_x3": 50.11,
"r_y3": 265.31,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 285.85,
"r_x1": 286.37,
"r_y1": 285.85,
"r_x2": 286.37,
"r_y2": 277.26,
"r_x3": 50.11,
"r_y3": 277.26,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 297.8,
"r_x1": 286.37,
"r_y1": 297.8,
"r_x2": 286.37,
"r_y2": 289.22,
"r_x3": 50.11,
"r_y3": 289.22,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 309.76,
"r_x1": 286.37,
"r_y1": 309.76,
"r_x2": 286.37,
"r_y2": 301.17,
"r_x3": 50.11,
"r_y3": 301.17,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 321.71,
"r_x1": 286.37,
"r_y1": 321.71,
"r_x2": 286.37,
"r_y2": 313.13,
"r_x3": 50.11,
"r_y3": 313.13,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 333.67,
"r_x1": 286.37,
"r_y1": 333.67,
"r_x2": 286.37,
"r_y2": 325.08,
"r_x3": 50.11,
"r_y3": 325.08,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 345.62,
"r_x1": 286.37,
"r_y1": 345.62,
"r_x2": 286.37,
"r_y2": 337.04,
"r_x3": 50.11,
"r_y3": 337.04,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 357.58,
"r_x1": 286.37,
"r_y1": 357.58,
"r_x2": 286.37,
"r_y2": 348.99,
"r_x3": 50.11,
"r_y3": 348.99,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 369.53,
"r_x1": 286.37,
"r_y1": 369.53,
"r_x2": 286.37,
"r_y2": 360.95,
"r_x3": 50.11,
"r_y3": 360.95,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 381.49,
"r_x1": 286.37,
"r_y1": 381.49,
"r_x2": 286.37,
"r_y2": 372.9,
"r_x3": 50.11,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 393.44,
"r_x1": 286.37,
"r_y1": 393.44,
"r_x2": 286.37,
"r_y2": 384.86,
"r_x3": 50.11,
"r_y3": 384.86,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 405.4,
"r_x1": 286.37,
"r_y1": 405.4,
"r_x2": 286.37,
"r_y2": 396.81,
"r_x3": 50.11,
"r_y3": 396.81,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 417.35,
"r_x1": 286.37,
"r_y1": 417.35,
"r_x2": 286.37,
"r_y2": 408.77,
"r_x3": 50.11,
"r_y3": 408.77,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 429.31,
"r_x1": 286.37,
"r_y1": 429.31,
"r_x2": 286.37,
"r_y2": 420.72,
"r_x3": 50.11,
"r_y3": 420.72,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 441.27,
"r_x1": 207.23,
"r_y1": 441.27,
"r_x2": 207.23,
"r_y2": 432.68,
"r_x3": 50.11,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.27,
"r_x1": 286.37,
"r_y1": 441.27,
"r_x2": 286.37,
"r_y2": 432.68,
"r_x3": 214.1,
"r_y3": 432.68,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 453.22,
"r_x1": 286.37,
"r_y1": 453.22,
"r_x2": 286.37,
"r_y2": 444.63,
"r_x3": 50.11,
"r_y3": 444.63,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 465.18,
"r_x1": 286.37,
"r_y1": 465.18,
"r_x2": 286.37,
"r_y2": 456.59,
"r_x3": 50.11,
"r_y3": 456.59,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 477.13,
"r_x1": 286.37,
"r_y1": 477.13,
"r_x2": 286.37,
"r_y2": 468.54,
"r_x3": 50.11,
"r_y3": 468.54,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 489.09,
"r_x1": 286.37,
"r_y1": 489.09,
"r_x2": 286.37,
"r_y2": 480.5,
"r_x3": 50.11,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.04,
"r_x1": 286.37,
"r_y1": 501.04,
"r_x2": 286.37,
"r_y2": 492.45,
"r_x3": 50.11,
"r_y3": 492.45,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 513.0,
"r_x1": 276.65,
"r_y1": 513.0,
"r_x2": 276.65,
"r_y2": 504.41,
"r_x3": 50.11,
"r_y3": 504.41,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."
},
{
"label": "section_header",
"id": 4,
"page_no": 0,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 539.94,
"r": 126.95,
"b": 550.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.932,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.69,
"r_x1": 58.12,
"r_y1": 550.69,
"r_x2": 58.12,
"r_y2": 539.94,
"r_x3": 50.11,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.69,
"r_x1": 126.95,
"r_y1": 550.69,
"r_x2": 126.95,
"r_y2": 539.94,
"r_x3": 68.8,
"r_y3": 539.94,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Introduction"
},
{
"label": "text",
"id": 1,
"page_no": 0,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 560.78,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 569.69,
"r_x1": 286.36,
"r_y1": 569.69,
"r_x2": 286.36,
"r_y2": 560.78,
"r_x3": 62.07,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 76.4,
"r_y1": 713.15,
"r_x2": 76.4,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."
},
{
"label": "section_header",
"id": 14,
"page_no": 0,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.57,
"t": 218.01,
"r": 408.44,
"b": 226.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.672,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 226.75,
"r_x1": 324.01,
"r_y1": 226.75,
"r_x2": 324.01,
"r_y2": 218.01,
"r_x3": 315.57,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.23,
"r_y0": 226.75,
"r_x1": 408.44,
"r_y1": 226.75,
"r_x2": 408.44,
"r_y2": 218.01,
"r_x3": 328.23,
"r_y3": 218.01,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a. Picture of a table:"
},
{
"label": "list_item",
"id": 17,
"page_no": 0,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 313.69,
"r": 486.4,
"b": 333.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.555,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 322.44,
"r_x1": 325.06,
"r_y1": 322.44,
"r_x2": 325.06,
"r_y2": 313.69,
"r_x3": 315.57,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.44,
"r_x1": 486.4,
"r_y1": 322.44,
"r_x2": 486.4,
"r_y2": 313.69,
"r_x3": 329.8,
"r_y3": 313.69,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.46,
"r_y0": 333.24,
"r_x1": 472.47,
"r_y1": 333.24,
"r_x2": 472.47,
"r_y2": 324.49,
"r_x3": 326.46,
"r_y3": 324.49,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"
},
{
"label": "list_item",
"id": 18,
"page_no": 0,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.57,
"t": 420.18,
"r": 491.19,
"b": 428.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.57,
"r_y0": 428.93,
"r_x1": 324.81,
"r_y1": 428.93,
"r_x2": 324.81,
"r_y2": 420.18,
"r_x3": 315.57,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.43,
"r_y0": 428.93,
"r_x1": 491.19,
"r_y1": 428.93,
"r_x2": 491.19,
"r_y2": 420.18,
"r_x3": 329.43,
"r_y3": 420.18,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "c. Structure predicted by TableFormer:"
},
{
"label": "picture",
"id": 10,
"page_no": 0,
"cluster": {
"id": 10,
"label": "picture",
"bbox": {
"l": 314.78,
"t": 338.07,
"r": 539.18,
"b": 410.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.874,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.15,
"t": 342.83,
"r": 412.54,
"b": 351.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.15,
"r_y0": 351.61,
"r_x1": 412.54,
"r_y1": 351.61,
"r_x2": 412.54,
"r_y2": 342.83,
"r_x3": 408.15,
"r_y3": 342.83,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.11,
"t": 341.57,
"r": 360.5,
"b": 350.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.11,
"r_y0": 350.36,
"r_x1": 360.5,
"r_y1": 350.36,
"r_x2": 360.5,
"r_y2": 341.57,
"r_x3": 356.11,
"r_y3": 341.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.68,
"t": 340.94,
"r": 505.07,
"b": 349.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.68,
"r_y0": 349.72,
"r_x1": 505.07,
"r_y1": 349.72,
"r_x2": 505.07,
"r_y2": 340.94,
"r_x3": 500.68,
"r_y3": 340.94,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.13,
"t": 351.75,
"r": 360.53,
"b": 360.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.13,
"r_y0": 360.53,
"r_x1": 360.53,
"r_y1": 360.53,
"r_x2": 360.53,
"r_y2": 351.75,
"r_x3": 356.13,
"r_y3": 351.75,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.54,
"t": 355.88,
"r": 406.93,
"b": 364.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.54,
"r_y0": 364.66,
"r_x1": 406.93,
"r_y1": 364.66,
"r_x2": 406.93,
"r_y2": 355.88,
"r_x3": 402.54,
"r_y3": 355.88,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.58,
"t": 352.84,
"r": 452.97,
"b": 361.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.58,
"r_y0": 361.63,
"r_x1": 452.97,
"r_y1": 361.63,
"r_x2": 452.97,
"r_y2": 352.84,
"r_x3": 448.58,
"r_y3": 352.84,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.65,
"t": 353.71,
"r": 496.04,
"b": 362.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.65,
"r_y0": 362.49,
"r_x1": 496.04,
"r_y1": 362.49,
"r_x2": 496.04,
"r_y2": 353.71,
"r_x3": 491.65,
"r_y3": 353.71,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.14,
"t": 353.34,
"r": 539.53,
"b": 362.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.14,
"r_y0": 362.12,
"r_x1": 539.53,
"r_y1": 362.12,
"r_x2": 539.53,
"r_y2": 353.34,
"r_x3": 535.14,
"r_y3": 353.34,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.83,
"t": 387.1,
"r": 353.22,
"b": 395.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.83,
"r_y0": 395.88,
"r_x1": 353.22,
"r_y1": 395.88,
"r_x2": 353.22,
"r_y2": 387.1,
"r_x3": 348.83,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.27,
"t": 375.37,
"r": 393.66,
"b": 384.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.27,
"r_y0": 384.16,
"r_x1": 393.66,
"r_y1": 384.16,
"r_x2": 393.66,
"r_y2": 375.37,
"r_x3": 389.27,
"r_y3": 375.37,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.67,
"t": 375.65,
"r": 451.46,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.67,
"r_y0": 384.43,
"r_x1": 451.46,
"r_y1": 384.43,
"r_x2": 451.46,
"r_y2": 375.65,
"r_x3": 442.67,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.44,
"t": 375.53,
"r": 485.9,
"b": 384.32,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.44,
"r_y0": 384.32,
"r_x1": 485.9,
"r_y1": 384.32,
"r_x2": 485.9,
"r_y2": 375.53,
"r_x3": 477.44,
"r_y3": 375.53,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.57,
"t": 375.65,
"r": 531.36,
"b": 384.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.57,
"r_y0": 384.43,
"r_x1": 531.36,
"r_y1": 384.43,
"r_x2": 531.36,
"r_y2": 375.65,
"r_x3": 522.57,
"r_y3": 375.65,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.23,
"t": 387.11,
"r": 409.01,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.23,
"r_y0": 395.9,
"r_x1": 409.01,
"r_y1": 395.9,
"r_x2": 409.01,
"r_y2": 387.11,
"r_x3": 400.23,
"r_y3": 387.11,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.31,
"t": 386.99,
"r": 451.09,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 395.77,
"r_x1": 451.09,
"r_y1": 395.77,
"r_x2": 451.09,
"r_y2": 386.99,
"r_x3": 442.31,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.22,
"t": 387.37,
"r": 487.0,
"b": 396.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.22,
"r_y0": 396.16,
"r_x1": 487.0,
"r_y1": 396.16,
"r_x2": 487.0,
"r_y2": 387.37,
"r_x3": 478.22,
"r_y3": 387.37,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.23,
"t": 386.99,
"r": 532.01,
"b": 395.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.23,
"r_y0": 395.77,
"r_x1": 532.01,
"r_y1": 395.77,
"r_x2": 532.01,
"r_y2": 386.99,
"r_x3": 523.23,
"r_y3": 386.99,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.57,
"t": 399.42,
"r": 415.96,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.57,
"r_y0": 408.21,
"r_x1": 415.96,
"r_y1": 408.21,
"r_x2": 415.96,
"r_y2": 399.42,
"r_x3": 411.57,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 415.96,
"t": 399.42,
"r": 420.36,
"b": 408.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.96,
"r_y0": 408.21,
"r_x1": 420.36,
"r_y1": 408.21,
"r_x2": 420.36,
"r_y2": 399.42,
"r_x3": 415.96,
"r_y3": 399.42,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.31,
"t": 399.04,
"r": 451.09,
"b": 407.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.31,
"r_y0": 407.82,
"r_x1": 451.09,
"r_y1": 407.82,
"r_x2": 451.09,
"r_y2": 399.04,
"r_x3": 442.31,
"r_y3": 399.04,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.78,
"t": 399.0,
"r": 487.56,
"b": 407.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.78,
"r_y0": 407.78,
"r_x1": 487.56,
"r_y1": 407.78,
"r_x2": 487.56,
"r_y2": 399.0,
"r_x3": 478.78,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 523.97,
"t": 398.61,
"r": 532.76,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.97,
"r_y0": 407.4,
"r_x1": 532.76,
"r_y1": 407.4,
"r_x2": 532.76,
"r_y2": 398.61,
"r_x3": 523.97,
"r_y3": 398.61,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.09,
"t": 357.76,
"r": 391.1,
"b": 367.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.09,
"r_y0": 367.89,
"r_x1": 391.1,
"r_y1": 367.89,
"r_x2": 391.1,
"r_y2": 357.76,
"r_x3": 385.09,
"r_y3": 357.76,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.43,
"t": 380.73,
"r": 339.44,
"b": 390.86,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.43,
"r_y0": 390.86,
"r_x1": 339.44,
"r_y1": 390.86,
"r_x2": 339.44,
"r_y2": 380.73,
"r_x3": 333.43,
"r_y3": 380.73,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.07,
"t": 341.04,
"r": 484.08,
"b": 351.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.07,
"r_y0": 351.17,
"r_x1": 484.08,
"r_y1": 351.17,
"r_x2": 484.08,
"r_y2": 341.04,
"r_x3": 478.07,
"r_y3": 341.04,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 23,
"page_no": 0,
"cluster": {
"id": 23,
"label": "picture",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.509,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.72,
"t": 433.82,
"r": 536.84,
"b": 496.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 446.47,
"r_x1": 351.64,
"r_y1": 446.47,
"r_x2": 351.64,
"r_y2": 437.69,
"r_x3": 347.25,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.88,
"r_y0": 446.47,
"r_x1": 323.27,
"r_y1": 446.47,
"r_x2": 323.27,
"r_y2": 437.69,
"r_x3": 318.88,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.69,
"r": 398.5,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.47,
"r_x1": 398.5,
"r_y1": 446.47,
"r_x2": 398.5,
"r_y2": 437.69,
"r_x3": 394.1,
"r_y3": 437.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 458.33,
"r_x1": 323.17,
"r_y1": 458.33,
"r_x2": 323.17,
"r_y2": 449.55,
"r_x3": 318.77,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.25,
"t": 449.55,
"r": 351.64,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 458.33,
"r_x1": 351.64,
"r_y1": 458.33,
"r_x2": 351.64,
"r_y2": 449.55,
"r_x3": 347.25,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.33,
"r_x1": 398.5,
"r_y1": 458.33,
"r_x2": 398.5,
"r_y2": 449.55,
"r_x3": 394.1,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 458.33,
"r_x1": 445.35,
"r_y1": 458.33,
"r_x2": 445.35,
"r_y2": 449.55,
"r_x3": 440.96,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 458.33,
"r_x1": 492.21,
"r_y1": 458.33,
"r_x2": 492.21,
"r_y2": 449.55,
"r_x3": 487.81,
"r_y3": 449.55,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.77,
"r_y0": 482.49,
"r_x1": 323.17,
"r_y1": 482.49,
"r_x2": 323.17,
"r_y2": 473.7,
"r_x3": 318.77,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 470.63,
"r_x1": 351.64,
"r_y1": 470.63,
"r_x2": 351.64,
"r_y2": 461.84,
"r_x3": 347.25,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.63,
"r_x1": 402.89,
"r_y1": 470.63,
"r_x2": 402.89,
"r_y2": 461.84,
"r_x3": 394.1,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 470.63,
"r_x1": 449.42,
"r_y1": 470.63,
"r_x2": 449.42,
"r_y2": 461.84,
"r_x3": 440.96,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 470.63,
"r_x1": 496.6,
"r_y1": 470.63,
"r_x2": 496.6,
"r_y2": 461.84,
"r_x3": 487.81,
"r_y3": 461.84,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 482.49,
"r_x1": 356.03,
"r_y1": 482.49,
"r_x2": 356.03,
"r_y2": 473.7,
"r_x3": 347.25,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.49,
"r_x1": 402.89,
"r_y1": 482.49,
"r_x2": 402.89,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 482.49,
"r_x1": 449.74,
"r_y1": 482.49,
"r_x2": 449.74,
"r_y2": 473.7,
"r_x3": 440.96,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 482.49,
"r_x1": 496.6,
"r_y1": 482.49,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.81,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.25,
"r_y0": 493.91,
"r_x1": 356.03,
"r_y1": 493.91,
"r_x2": 356.03,
"r_y2": 485.12,
"r_x3": 347.25,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.91,
"r_x1": 402.89,
"r_y1": 493.91,
"r_x2": 402.89,
"r_y2": 485.12,
"r_x3": 394.1,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.96,
"r_y0": 493.91,
"r_x1": 449.74,
"r_y1": 493.91,
"r_x2": 449.74,
"r_y2": 485.12,
"r_x3": 440.96,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.81,
"r_y0": 493.91,
"r_x1": 496.6,
"r_y1": 493.91,
"r_x2": 496.6,
"r_y2": 485.12,
"r_x3": 487.81,
"r_y3": 485.12,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.25,
"r_x1": 372.71,
"r_y1": 459.25,
"r_x2": 372.71,
"r_y2": 449.12,
"r_x3": 366.7,
"r_y3": 449.12,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.32,
"r": 337.91,
"b": 483.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.45,
"r_x1": 337.91,
"r_y1": 483.45,
"r_x2": 337.91,
"r_y2": 473.32,
"r_x3": 331.9,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.88,
"t": 437.59,
"r": 465.88,
"b": 447.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.88,
"r_y0": 447.72,
"r_x1": 465.88,
"r_y1": 447.72,
"r_x2": 465.88,
"r_y2": 437.59,
"r_x3": 459.88,
"r_y3": 437.59,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.25,
"t": 437.69,
"r": 351.64,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.88,
"t": 437.69,
"r": 323.27,
"b": 446.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 449.55,
"r": 323.17,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 449.12,
"r": 372.71,
"b": 459.25,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.55,
"r": 398.5,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 449.55,
"r": 445.35,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 449.55,
"r": 492.21,
"b": 458.33,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.77,
"t": 473.7,
"r": 323.17,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 461.84,
"r": 351.64,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.84,
"r": 402.89,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 461.84,
"r": 449.42,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 461.84,
"r": 496.6,
"b": 470.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 473.7,
"r": 356.03,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.89,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 473.7,
"r": 449.74,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 473.7,
"r": 496.6,
"b": 482.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.25,
"t": 485.12,
"r": 356.03,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.12,
"r": 402.89,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 440.96,
"t": 485.12,
"r": 449.74,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.81,
"t": 485.12,
"r": 496.6,
"b": 493.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "picture",
"id": 16,
"page_no": 0,
"cluster": {
"id": 16,
"label": "picture",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.609,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.65,
"t": 228.72,
"r": 537.15,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.652,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.95,
"r_y0": 245.48,
"r_x1": 457.95,
"r_y1": 245.48,
"r_x2": 457.95,
"r_y2": 235.35,
"r_x3": 451.95,
"r_y3": 235.35,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.35,
"r": 337.2,
"b": 279.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.48,
"r_x1": 337.2,
"r_y1": 279.48,
"r_x2": 337.2,
"r_y2": 269.35,
"r_x3": 331.2,
"r_y3": 269.35,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.03,
"t": 252.68,
"r": 390.04,
"b": 262.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.03,
"r_y0": 262.81,
"r_x1": 390.04,
"r_y1": 262.81,
"r_x2": 390.04,
"r_y2": 252.68,
"r_x3": 384.03,
"r_y3": 252.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.95,
"t": 235.35,
"r": 457.95,
"b": 245.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 0,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 514.5,
"r": 545.12,
"b": 559.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.921,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 523.41,
"r_x1": 345.73,
"r_y1": 523.41,
"r_x2": 345.73,
"r_y2": 514.5,
"r_x3": 308.86,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.18,
"r_y0": 523.41,
"r_x1": 545.12,
"r_y1": 523.41,
"r_x2": 545.12,
"r_y2": 514.5,
"r_x3": 353.18,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 535.36,
"r_x1": 545.12,
"r_y1": 535.36,
"r_x2": 545.12,
"r_y2": 526.46,
"r_x3": 308.86,
"r_y3": 526.46,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 547.32,
"r_x1": 545.12,
"r_y1": 547.32,
"r_x2": 545.12,
"r_y2": 538.41,
"r_x3": 308.86,
"r_y3": 538.41,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 559.27,
"r_x1": 505.69,
"r_y1": 559.27,
"r_x2": 505.69,
"r_y2": 550.37,
"r_x3": 308.86,
"r_y3": 550.37,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."
},
{
"label": "text",
"id": 0,
"page_no": 0,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 584.41,
"r": 545.12,
"b": 665.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 593.32,
"r_x1": 545.11,
"r_y1": 593.32,
"r_x2": 545.11,
"r_y2": 584.41,
"r_x3": 320.82,
"r_y3": 584.41,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.27,
"r_x1": 545.12,
"r_y1": 605.27,
"r_x2": 545.12,
"r_y2": 596.36,
"r_x3": 308.86,
"r_y3": 596.36,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.23,
"r_x1": 545.12,
"r_y1": 617.23,
"r_x2": 545.12,
"r_y2": 608.32,
"r_x3": 308.86,
"r_y3": 608.32,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.18,
"r_x1": 545.12,
"r_y1": 629.18,
"r_x2": 545.12,
"r_y2": 620.27,
"r_x3": 308.86,
"r_y3": 620.27,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.14,
"r_x1": 353.69,
"r_y1": 641.14,
"r_x2": 353.69,
"r_y2": 632.23,
"r_x3": 308.86,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.11,
"r_y0": 641.14,
"r_x1": 374.67,
"r_y1": 641.14,
"r_x2": 374.67,
"r_y2": 632.23,
"r_x3": 362.11,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.36,
"r_y0": 641.14,
"r_x1": 545.12,
"r_y1": 641.14,
"r_x2": 545.12,
"r_y2": 632.23,
"r_x3": 377.36,
"r_y3": 632.23,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.09,
"r_x1": 545.12,
"r_y1": 653.09,
"r_x2": 545.12,
"r_y2": 644.19,
"r_x3": 308.86,
"r_y3": 644.19,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.05,
"r_x1": 375.55,
"r_y1": 665.05,
"r_x2": 375.55,
"r_y2": 656.14,
"r_x3": 308.86,
"r_y3": 656.14,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."
},
{
"label": "text",
"id": 3,
"page_no": 0,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.38,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 320.82,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.11,
"r_y1": 713.15,
"r_x2": 545.11,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"
}
],
"headers": [
{
"label": "page_footer",
"id": 12,
"page_no": 0,
"cluster": {
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.805,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1"
},
{
"label": "page_header",
"id": 9,
"page_no": 0,
"cluster": {
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.34,
"t": 207.82,
"r": 36.34,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.34,
"r_y0": 560.0,
"r_x1": 36.34,
"r_y1": 560.0,
"r_x2": 36.34,
"r_y2": 207.82,
"r_x3": 18.34,
"r_y3": 207.82,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"
}
]
}
},
{
"page_no": 1,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 112.65,
"r_y1": 96.07,
"r_x2": 112.65,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 108.48,
"r_x1": 286.36,
"r_y1": 108.48,
"r_x2": 286.36,
"r_y2": 99.57,
"r_x3": 62.07,
"r_y3": 99.57,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.43,
"r_x1": 74.75,
"r_y1": 120.43,
"r_x2": 74.75,
"r_y2": 111.53,
"r_x3": 50.11,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.33,
"r_y0": 120.43,
"r_x1": 286.37,
"r_y1": 120.43,
"r_x2": 286.37,
"r_y2": 111.53,
"r_x3": 81.33,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 132.39,
"r_x1": 286.37,
"r_y1": 132.39,
"r_x2": 286.37,
"r_y2": 123.48,
"r_x3": 50.11,
"r_y3": 123.48,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 144.34,
"r_x1": 286.37,
"r_y1": 144.34,
"r_x2": 286.37,
"r_y2": 135.44,
"r_x3": 50.11,
"r_y3": 135.44,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 156.3,
"r_x1": 286.37,
"r_y1": 156.3,
"r_x2": 286.37,
"r_y2": 147.39,
"r_x3": 50.11,
"r_y3": 147.39,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 168.25,
"r_x1": 286.37,
"r_y1": 168.25,
"r_x2": 286.37,
"r_y2": 159.35,
"r_x3": 50.11,
"r_y3": 159.35,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.21,
"r_x1": 286.37,
"r_y1": 180.21,
"r_x2": 286.37,
"r_y2": 171.3,
"r_x3": 50.11,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.16,
"r_x1": 286.37,
"r_y1": 192.16,
"r_x2": 286.37,
"r_y2": 183.26,
"r_x3": 50.11,
"r_y3": 183.26,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.12,
"r_x1": 286.37,
"r_y1": 204.12,
"r_x2": 286.37,
"r_y2": 195.21,
"r_x3": 50.11,
"r_y3": 195.21,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.07,
"r_x1": 286.37,
"r_y1": 216.07,
"r_x2": 286.37,
"r_y2": 207.17,
"r_x3": 50.11,
"r_y3": 207.17,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.03,
"r_x1": 278.66,
"r_y1": 228.03,
"r_x2": 278.66,
"r_y2": 219.12,
"r_x3": 50.11,
"r_y3": 219.12,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 240.44,
"r_x1": 286.36,
"r_y1": 240.44,
"r_x2": 286.36,
"r_y2": 231.53,
"r_x3": 62.07,
"r_y3": 231.53,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 252.39,
"r_x1": 286.37,
"r_y1": 252.39,
"r_x2": 286.37,
"r_y2": 243.49,
"r_x3": 50.11,
"r_y3": 243.49,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.35,
"r_x1": 286.37,
"r_y1": 264.35,
"r_x2": 286.37,
"r_y2": 255.44,
"r_x3": 50.11,
"r_y3": 255.44,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.3,
"r_x1": 286.37,
"r_y1": 276.3,
"r_x2": 286.37,
"r_y2": 267.4,
"r_x3": 50.11,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.26,
"r_x1": 286.37,
"r_y1": 288.26,
"r_x2": 286.37,
"r_y2": 279.35,
"r_x3": 50.11,
"r_y3": 279.35,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.21,
"r_x1": 88.57,
"r_y1": 300.21,
"r_x2": 88.57,
"r_y2": 291.31,
"r_x3": 50.11,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.21,
"r_x1": 286.37,
"r_y1": 300.21,
"r_x2": 286.37,
"r_y2": 291.31,
"r_x3": 95.5,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.17,
"r_x1": 286.37,
"r_y1": 312.17,
"r_x2": 286.37,
"r_y2": 303.26,
"r_x3": 50.11,
"r_y3": 303.26,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.12,
"r_x1": 286.37,
"r_y1": 324.12,
"r_x2": 286.37,
"r_y2": 315.22,
"r_x3": 50.11,
"r_y3": 315.22,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.08,
"r_x1": 286.37,
"r_y1": 336.08,
"r_x2": 286.37,
"r_y2": 327.17,
"r_x3": 50.11,
"r_y3": 327.17,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.03,
"r_x1": 286.37,
"r_y1": 348.03,
"r_x2": 286.37,
"r_y2": 339.13,
"r_x3": 50.11,
"r_y3": 339.13,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.99,
"r_x1": 286.37,
"r_y1": 359.99,
"r_x2": 286.37,
"r_y2": 351.08,
"r_x3": 50.11,
"r_y3": 351.08,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.95,
"r_x1": 76.95,
"r_y1": 371.95,
"r_x2": 76.95,
"r_y2": 363.04,
"r_x3": 50.11,
"r_y3": 363.04,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 384.35,
"r_x1": 286.36,
"r_y1": 384.35,
"r_x2": 286.36,
"r_y2": 375.45,
"r_x3": 62.07,
"r_y3": 375.45,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.31,
"r_x1": 120.99,
"r_y1": 396.31,
"r_x2": 120.99,
"r_y2": 387.4,
"r_x3": 50.11,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.24,
"r_x1": 179.73,
"r_y1": 396.24,
"r_x2": 179.73,
"r_y2": 387.28,
"r_x3": 123.9,
"r_y3": 387.28,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.65,
"r_y0": 396.31,
"r_x1": 286.37,
"r_y1": 396.31,
"r_x2": 286.37,
"r_y2": 387.4,
"r_x3": 182.65,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.26,
"r_x1": 181.76,
"r_y1": 408.26,
"r_x2": 181.76,
"r_y2": 399.36,
"r_x3": 50.11,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.19,
"r_x1": 240.2,
"r_y1": 408.19,
"r_x2": 240.2,
"r_y2": 399.24,
"r_x3": 184.1,
"r_y3": 399.24,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.26,
"r_x1": 286.36,
"r_y1": 408.26,
"r_x2": 286.36,
"r_y2": 399.36,
"r_x3": 240.2,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.22,
"r_x1": 286.37,
"r_y1": 420.22,
"r_x2": 286.37,
"r_y2": 411.31,
"r_x3": 50.11,
"r_y3": 411.31,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.17,
"r_x1": 82.52,
"r_y1": 432.17,
"r_x2": 82.52,
"r_y2": 423.27,
"r_x3": 50.11,
"r_y3": 423.27,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 453.46,
"r_x1": 70.74,
"r_y1": 453.46,
"r_x2": 70.74,
"r_y2": 444.55,
"r_x3": 61.57,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.03,
"r_y0": 453.46,
"r_x1": 117.1,
"r_y1": 453.46,
"r_x2": 117.1,
"r_y2": 444.55,
"r_x3": 73.03,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.59,
"r_y0": 453.39,
"r_x1": 175.42,
"r_y1": 453.39,
"r_x2": 175.42,
"r_y2": 444.43,
"r_x3": 119.59,
"r_y3": 444.43,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.42,
"r_y0": 453.46,
"r_x1": 286.36,
"r_y1": 453.46,
"r_x2": 286.36,
"r_y2": 444.55,
"r_x3": 175.42,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 465.41,
"r_x1": 286.36,
"r_y1": 465.41,
"r_x2": 286.36,
"r_y2": 456.51,
"r_x3": 70.04,
"r_y3": 456.51,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 477.37,
"r_x1": 286.36,
"r_y1": 477.37,
"r_x2": 286.36,
"r_y2": 468.46,
"r_x3": 70.04,
"r_y3": 468.46,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 489.32,
"r_x1": 99.64,
"r_y1": 489.32,
"r_x2": 99.64,
"r_y2": 480.42,
"r_x3": 70.04,
"r_y3": 480.42,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 511.06,
"r_x1": 71.62,
"r_y1": 511.06,
"r_x2": 71.62,
"r_y2": 502.15,
"r_x3": 61.57,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.13,
"r_y0": 511.06,
"r_x1": 196.1,
"r_y1": 511.06,
"r_x2": 196.1,
"r_y2": 502.15,
"r_x3": 74.13,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.31,
"r_y0": 510.99,
"r_x1": 256.14,
"r_y1": 510.99,
"r_x2": 256.14,
"r_y2": 502.03,
"r_x3": 200.31,
"r_y3": 502.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.35,
"r_y0": 511.06,
"r_x1": 286.36,
"r_y1": 511.06,
"r_x2": 286.36,
"r_y2": 502.15,
"r_x3": 260.35,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 523.01,
"r_x1": 286.36,
"r_y1": 523.01,
"r_x2": 286.36,
"r_y2": 514.11,
"r_x3": 70.04,
"r_y3": 514.11,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 534.97,
"r_x1": 286.36,
"r_y1": 534.97,
"r_x2": 286.36,
"r_y2": 526.06,
"r_x3": 70.04,
"r_y3": 526.06,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 546.93,
"r_x1": 161.65,
"r_y1": 546.93,
"r_x2": 161.65,
"r_y2": 538.02,
"r_x3": 70.04,
"r_y3": 538.02,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 568.66,
"r_x1": 71.12,
"r_y1": 568.66,
"r_x2": 71.12,
"r_y2": 559.76,
"r_x3": 61.57,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.66,
"r_x1": 116.71,
"r_y1": 568.66,
"r_x2": 116.71,
"r_y2": 559.76,
"r_x3": 73.5,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.58,
"r_y0": 568.59,
"r_x1": 177.68,
"r_y1": 568.59,
"r_x2": 177.68,
"r_y2": 559.64,
"r_x3": 121.58,
"r_y3": 559.64,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.55,
"r_y0": 568.66,
"r_x1": 286.36,
"r_y1": 568.66,
"r_x2": 286.36,
"r_y2": 559.76,
"r_x3": 182.55,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 580.62,
"r_x1": 286.36,
"r_y1": 580.62,
"r_x2": 286.36,
"r_y2": 571.71,
"r_x3": 70.04,
"r_y3": 571.71,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 592.57,
"r_x1": 82.4,
"r_y1": 592.57,
"r_x2": 82.4,
"r_y2": 583.67,
"r_x3": 70.04,
"r_y3": 583.67,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 614.31,
"r_x1": 72.33,
"r_y1": 614.31,
"r_x2": 72.33,
"r_y2": 605.4,
"r_x3": 61.57,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.02,
"r_y0": 614.31,
"r_x1": 286.37,
"r_y1": 614.31,
"r_x2": 286.37,
"r_y2": 605.4,
"r_x3": 75.02,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 626.26,
"r_x1": 286.36,
"r_y1": 626.26,
"r_x2": 286.36,
"r_y2": 617.36,
"r_x3": 70.04,
"r_y3": 617.36,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 638.22,
"r_x1": 198.06,
"r_y1": 638.22,
"r_x2": 198.06,
"r_y2": 629.31,
"r_x3": 70.04,
"r_y3": 629.31,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 659.5,
"r_x1": 286.36,
"r_y1": 659.5,
"r_x2": 286.36,
"r_y2": 650.6,
"r_x3": 62.07,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 671.46,
"r_x1": 286.37,
"r_y1": 671.46,
"r_x2": 286.37,
"r_y2": 662.55,
"r_x3": 50.11,
"r_y3": 662.55,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 683.41,
"r_x1": 286.37,
"r_y1": 683.41,
"r_x2": 286.37,
"r_y2": 674.51,
"r_x3": 50.11,
"r_y3": 674.51,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 695.37,
"r_x1": 286.37,
"r_y1": 695.37,
"r_x2": 286.37,
"r_y2": 686.46,
"r_x3": 50.11,
"r_y3": 686.46,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.97,
"r_y0": 712.72,
"r_x1": 183.73,
"r_y1": 712.72,
"r_x2": 183.73,
"r_y2": 705.6,
"r_x3": 60.97,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 508.08,
"r_y1": 108.02,
"r_x2": 508.08,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 132.48,
"r_x1": 315.58,
"r_y1": 132.48,
"r_x2": 315.58,
"r_y2": 121.73,
"r_x3": 308.86,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.54,
"r_y0": 132.48,
"r_x1": 498.28,
"r_y1": 132.48,
"r_x2": 498.28,
"r_y2": 121.73,
"r_x3": 324.54,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 151.13,
"r_x1": 545.11,
"r_y1": 151.13,
"r_x2": 545.11,
"r_y2": 142.22,
"r_x3": 320.82,
"r_y3": 142.22,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 163.08,
"r_x1": 545.12,
"r_y1": 163.08,
"r_x2": 545.12,
"r_y2": 154.18,
"r_x3": 308.86,
"r_y3": 154.18,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 175.04,
"r_x1": 522.56,
"r_y1": 175.04,
"r_x2": 522.56,
"r_y2": 166.13,
"r_x3": 308.86,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 175.04,
"r_x1": 545.12,
"r_y1": 175.04,
"r_x2": 545.12,
"r_y2": 166.13,
"r_x3": 529.62,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 186.99,
"r_x1": 545.12,
"r_y1": 186.99,
"r_x2": 545.12,
"r_y2": 178.09,
"r_x3": 308.86,
"r_y3": 178.09,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 198.95,
"r_x1": 545.12,
"r_y1": 198.95,
"r_x2": 545.12,
"r_y2": 190.04,
"r_x3": 308.86,
"r_y3": 190.04,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 210.9,
"r_x1": 346.98,
"r_y1": 210.9,
"r_x2": 346.98,
"r_y2": 202.0,
"r_x3": 308.86,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.87,
"r_y0": 210.9,
"r_x1": 545.12,
"r_y1": 210.9,
"r_x2": 545.12,
"r_y2": 202.0,
"r_x3": 354.87,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 222.86,
"r_x1": 545.12,
"r_y1": 222.86,
"r_x2": 545.12,
"r_y2": 213.95,
"r_x3": 308.86,
"r_y3": 213.95,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 234.81,
"r_x1": 530.92,
"r_y1": 234.81,
"r_x2": 530.92,
"r_y2": 225.91,
"r_x3": 308.86,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.92,
"r_y0": 234.81,
"r_x1": 545.12,
"r_y1": 234.81,
"r_x2": 545.12,
"r_y2": 225.91,
"r_x3": 537.92,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 246.77,
"r_x1": 545.12,
"r_y1": 246.77,
"r_x2": 545.12,
"r_y2": 237.86,
"r_x3": 308.86,
"r_y3": 237.86,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.72,
"r_x1": 545.12,
"r_y1": 258.72,
"r_x2": 545.12,
"r_y2": 249.82,
"r_x3": 308.86,
"r_y3": 249.82,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.68,
"r_x1": 439.84,
"r_y1": 270.68,
"r_x2": 439.84,
"r_y2": 261.77,
"r_x3": 308.86,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.44,
"r_y0": 270.46,
"r_x1": 452.19,
"r_y1": 270.46,
"r_x2": 452.19,
"r_y2": 261.61,
"r_x3": 444.44,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.89,
"r_y0": 270.46,
"r_x1": 470.83,
"r_y1": 270.46,
"r_x2": 470.83,
"r_y2": 261.61,
"r_x3": 455.89,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.83,
"r_y0": 270.68,
"r_x1": 545.12,
"r_y1": 270.68,
"r_x2": 545.12,
"r_y2": 261.77,
"r_x3": 470.83,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.63,
"r_x1": 545.12,
"r_y1": 282.63,
"r_x2": 545.12,
"r_y2": 273.73,
"r_x3": 308.86,
"r_y3": 273.73,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.59,
"r_x1": 545.12,
"r_y1": 294.59,
"r_x2": 545.12,
"r_y2": 285.68,
"r_x3": 308.86,
"r_y3": 285.68,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 306.55,
"r_x1": 545.12,
"r_y1": 306.55,
"r_x2": 545.12,
"r_y2": 297.64,
"r_x3": 308.86,
"r_y3": 297.64,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 318.5,
"r_x1": 545.12,
"r_y1": 318.5,
"r_x2": 545.12,
"r_y2": 309.59,
"r_x3": 308.86,
"r_y3": 309.59,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 330.46,
"r_x1": 425.92,
"r_y1": 330.46,
"r_x2": 425.92,
"r_y2": 321.55,
"r_x3": 308.86,
"r_y3": 321.55,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 342.48,
"r_x1": 545.11,
"r_y1": 342.48,
"r_x2": 545.11,
"r_y2": 333.57,
"r_x3": 320.82,
"r_y3": 333.57,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 354.43,
"r_x1": 545.11,
"r_y1": 354.43,
"r_x2": 545.11,
"r_y2": 345.52,
"r_x3": 308.86,
"r_y3": 345.52,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 366.39,
"r_x1": 545.12,
"r_y1": 366.39,
"r_x2": 545.12,
"r_y2": 357.48,
"r_x3": 308.86,
"r_y3": 357.48,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 378.34,
"r_x1": 545.12,
"r_y1": 378.34,
"r_x2": 545.12,
"r_y2": 369.44,
"r_x3": 308.86,
"r_y3": 369.44,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 390.3,
"r_x1": 545.12,
"r_y1": 390.3,
"r_x2": 545.12,
"r_y2": 381.39,
"r_x3": 308.86,
"r_y3": 381.39,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 402.25,
"r_x1": 545.12,
"r_y1": 402.25,
"r_x2": 545.12,
"r_y2": 393.35,
"r_x3": 308.86,
"r_y3": 393.35,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 414.21,
"r_x1": 545.12,
"r_y1": 414.21,
"r_x2": 545.12,
"r_y2": 405.3,
"r_x3": 308.86,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 426.16,
"r_x1": 545.12,
"r_y1": 426.16,
"r_x2": 545.12,
"r_y2": 417.26,
"r_x3": 308.86,
"r_y3": 417.26,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 438.12,
"r_x1": 545.12,
"r_y1": 438.12,
"r_x2": 545.12,
"r_y2": 429.21,
"r_x3": 308.86,
"r_y3": 429.21,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 450.07,
"r_x1": 401.29,
"r_y1": 450.07,
"r_x2": 401.29,
"r_y2": 441.17,
"r_x3": 308.86,
"r_y3": 441.17,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 462.02,
"r_x1": 423.26,
"r_y1": 462.02,
"r_x2": 423.26,
"r_y2": 453.07,
"r_x3": 320.82,
"r_y3": 453.07,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.27,
"r_y0": 462.09,
"r_x1": 545.11,
"r_y1": 462.09,
"r_x2": 545.11,
"r_y2": 453.19,
"r_x3": 423.27,
"r_y3": 453.19,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 474.05,
"r_x1": 545.12,
"r_y1": 474.05,
"r_x2": 545.12,
"r_y2": 465.14,
"r_x3": 308.86,
"r_y3": 465.14,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.86,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.85,
"r_y0": 486.0,
"r_x1": 545.12,
"r_y1": 486.0,
"r_x2": 545.12,
"r_y2": 477.1,
"r_x3": 345.85,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.96,
"r_x1": 545.11,
"r_y1": 497.96,
"r_x2": 545.11,
"r_y2": 489.05,
"r_x3": 308.86,
"r_y3": 489.05,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.91,
"r_x1": 545.11,
"r_y1": 509.91,
"r_x2": 545.11,
"r_y2": 501.01,
"r_x3": 308.86,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.87,
"r_x1": 545.12,
"r_y1": 521.87,
"r_x2": 545.12,
"r_y2": 512.96,
"r_x3": 308.86,
"r_y3": 512.96,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.82,
"r_x1": 545.12,
"r_y1": 533.82,
"r_x2": 545.12,
"r_y2": 524.92,
"r_x3": 308.86,
"r_y3": 524.92,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.78,
"r_x1": 420.94,
"r_y1": 545.78,
"r_x2": 420.94,
"r_y2": 536.87,
"r_x3": 308.86,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.59,
"r_y0": 545.56,
"r_x1": 433.56,
"r_y1": 545.56,
"r_x2": 433.56,
"r_y2": 536.16,
"r_x3": 423.59,
"r_y3": 536.16,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.21,
"r_y0": 545.78,
"r_x1": 545.11,
"r_y1": 545.78,
"r_x2": 545.11,
"r_y2": 536.87,
"r_x3": 436.21,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.73,
"r_x1": 545.12,
"r_y1": 557.73,
"r_x2": 545.12,
"r_y2": 548.83,
"r_x3": 308.86,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.69,
"r_x1": 545.11,
"r_y1": 569.69,
"r_x2": 545.11,
"r_y2": 560.78,
"r_x3": 308.86,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.64,
"r_x1": 545.11,
"r_y1": 581.64,
"r_x2": 545.11,
"r_y2": 572.74,
"r_x3": 308.86,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.6,
"r_x1": 545.12,
"r_y1": 593.6,
"r_x2": 545.12,
"r_y2": 584.69,
"r_x3": 308.86,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.56,
"r_x1": 497.08,
"r_y1": 605.56,
"r_x2": 497.08,
"r_y2": 596.65,
"r_x3": 308.86,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.34,
"r_x1": 509.77,
"r_y1": 605.34,
"r_x2": 509.77,
"r_y2": 595.93,
"r_x3": 499.8,
"r_y3": 595.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.56,
"r_x1": 545.11,
"r_y1": 605.56,
"r_x2": 545.11,
"r_y2": 596.65,
"r_x3": 512.5,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.51,
"r_x1": 545.12,
"r_y1": 617.51,
"r_x2": 545.12,
"r_y2": 608.6,
"r_x3": 308.86,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.47,
"r_x1": 545.12,
"r_y1": 629.47,
"r_x2": 545.12,
"r_y2": 620.56,
"r_x3": 308.86,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.42,
"r_x1": 364.78,
"r_y1": 641.42,
"r_x2": 364.78,
"r_y2": 632.51,
"r_x3": 308.86,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.57,
"r_y0": 641.19,
"r_x1": 415.61,
"r_y1": 641.19,
"r_x2": 415.61,
"r_y2": 632.6,
"r_x3": 367.57,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.61,
"r_y0": 641.42,
"r_x1": 545.12,
"r_y1": 641.42,
"r_x2": 545.12,
"r_y2": 632.51,
"r_x3": 415.61,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.51,
"r_x3": 308.86,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.91,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.43,
"r_x3": 376.91,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.12,
"r_y1": 677.29,
"r_x2": 545.12,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.01,
"r_x1": 356.9,
"r_y1": 689.01,
"r_x2": 356.9,
"r_y2": 680.42,
"r_x3": 308.86,
"r_y3": 680.42,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.13,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 357.13,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 12,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 112.65,
"r_y1": 96.07,
"r_x2": 112.65,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 99.57,
"r": 286.37,
"b": 228.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 108.48,
"r_x1": 286.36,
"r_y1": 108.48,
"r_x2": 286.36,
"r_y2": 99.57,
"r_x3": 62.07,
"r_y3": 99.57,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.43,
"r_x1": 74.75,
"r_y1": 120.43,
"r_x2": 74.75,
"r_y2": 111.53,
"r_x3": 50.11,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.33,
"r_y0": 120.43,
"r_x1": 286.37,
"r_y1": 120.43,
"r_x2": 286.37,
"r_y2": 111.53,
"r_x3": 81.33,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 132.39,
"r_x1": 286.37,
"r_y1": 132.39,
"r_x2": 286.37,
"r_y2": 123.48,
"r_x3": 50.11,
"r_y3": 123.48,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 144.34,
"r_x1": 286.37,
"r_y1": 144.34,
"r_x2": 286.37,
"r_y2": 135.44,
"r_x3": 50.11,
"r_y3": 135.44,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 156.3,
"r_x1": 286.37,
"r_y1": 156.3,
"r_x2": 286.37,
"r_y2": 147.39,
"r_x3": 50.11,
"r_y3": 147.39,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 168.25,
"r_x1": 286.37,
"r_y1": 168.25,
"r_x2": 286.37,
"r_y2": 159.35,
"r_x3": 50.11,
"r_y3": 159.35,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.21,
"r_x1": 286.37,
"r_y1": 180.21,
"r_x2": 286.37,
"r_y2": 171.3,
"r_x3": 50.11,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.16,
"r_x1": 286.37,
"r_y1": 192.16,
"r_x2": 286.37,
"r_y2": 183.26,
"r_x3": 50.11,
"r_y3": 183.26,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.12,
"r_x1": 286.37,
"r_y1": 204.12,
"r_x2": 286.37,
"r_y2": 195.21,
"r_x3": 50.11,
"r_y3": 195.21,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.07,
"r_x1": 286.37,
"r_y1": 216.07,
"r_x2": 286.37,
"r_y2": 207.17,
"r_x3": 50.11,
"r_y3": 207.17,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.03,
"r_x1": 278.66,
"r_y1": 228.03,
"r_x2": 278.66,
"r_y2": 219.12,
"r_x3": 50.11,
"r_y3": 219.12,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 231.53,
"r": 286.37,
"b": 371.95,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 240.44,
"r_x1": 286.36,
"r_y1": 240.44,
"r_x2": 286.36,
"r_y2": 231.53,
"r_x3": 62.07,
"r_y3": 231.53,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 252.39,
"r_x1": 286.37,
"r_y1": 252.39,
"r_x2": 286.37,
"r_y2": 243.49,
"r_x3": 50.11,
"r_y3": 243.49,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.35,
"r_x1": 286.37,
"r_y1": 264.35,
"r_x2": 286.37,
"r_y2": 255.44,
"r_x3": 50.11,
"r_y3": 255.44,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.3,
"r_x1": 286.37,
"r_y1": 276.3,
"r_x2": 286.37,
"r_y2": 267.4,
"r_x3": 50.11,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.26,
"r_x1": 286.37,
"r_y1": 288.26,
"r_x2": 286.37,
"r_y2": 279.35,
"r_x3": 50.11,
"r_y3": 279.35,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.21,
"r_x1": 88.57,
"r_y1": 300.21,
"r_x2": 88.57,
"r_y2": 291.31,
"r_x3": 50.11,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.21,
"r_x1": 286.37,
"r_y1": 300.21,
"r_x2": 286.37,
"r_y2": 291.31,
"r_x3": 95.5,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.17,
"r_x1": 286.37,
"r_y1": 312.17,
"r_x2": 286.37,
"r_y2": 303.26,
"r_x3": 50.11,
"r_y3": 303.26,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.12,
"r_x1": 286.37,
"r_y1": 324.12,
"r_x2": 286.37,
"r_y2": 315.22,
"r_x3": 50.11,
"r_y3": 315.22,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.08,
"r_x1": 286.37,
"r_y1": 336.08,
"r_x2": 286.37,
"r_y2": 327.17,
"r_x3": 50.11,
"r_y3": 327.17,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.03,
"r_x1": 286.37,
"r_y1": 348.03,
"r_x2": 286.37,
"r_y2": 339.13,
"r_x3": 50.11,
"r_y3": 339.13,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.99,
"r_x1": 286.37,
"r_y1": 359.99,
"r_x2": 286.37,
"r_y2": 351.08,
"r_x3": 50.11,
"r_y3": 351.08,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.95,
"r_x1": 76.95,
"r_y1": 371.95,
"r_x2": 76.95,
"r_y2": 363.04,
"r_x3": 50.11,
"r_y3": 363.04,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 375.45,
"r": 286.37,
"b": 432.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 384.35,
"r_x1": 286.36,
"r_y1": 384.35,
"r_x2": 286.36,
"r_y2": 375.45,
"r_x3": 62.07,
"r_y3": 375.45,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.31,
"r_x1": 120.99,
"r_y1": 396.31,
"r_x2": 120.99,
"r_y2": 387.4,
"r_x3": 50.11,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.24,
"r_x1": 179.73,
"r_y1": 396.24,
"r_x2": 179.73,
"r_y2": 387.28,
"r_x3": 123.9,
"r_y3": 387.28,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.65,
"r_y0": 396.31,
"r_x1": 286.37,
"r_y1": 396.31,
"r_x2": 286.37,
"r_y2": 387.4,
"r_x3": 182.65,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.26,
"r_x1": 181.76,
"r_y1": 408.26,
"r_x2": 181.76,
"r_y2": 399.36,
"r_x3": 50.11,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.19,
"r_x1": 240.2,
"r_y1": 408.19,
"r_x2": 240.2,
"r_y2": 399.24,
"r_x3": 184.1,
"r_y3": 399.24,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.26,
"r_x1": 286.36,
"r_y1": 408.26,
"r_x2": 286.36,
"r_y2": 399.36,
"r_x3": 240.2,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.22,
"r_x1": 286.37,
"r_y1": 420.22,
"r_x2": 286.37,
"r_y2": 411.31,
"r_x3": 50.11,
"r_y3": 411.31,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.17,
"r_x1": 82.52,
"r_y1": 432.17,
"r_x2": 82.52,
"r_y2": 423.27,
"r_x3": 50.11,
"r_y3": 423.27,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 444.43,
"r": 286.36,
"b": 489.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 453.46,
"r_x1": 70.74,
"r_y1": 453.46,
"r_x2": 70.74,
"r_y2": 444.55,
"r_x3": 61.57,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.03,
"r_y0": 453.46,
"r_x1": 117.1,
"r_y1": 453.46,
"r_x2": 117.1,
"r_y2": 444.55,
"r_x3": 73.03,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.59,
"r_y0": 453.39,
"r_x1": 175.42,
"r_y1": 453.39,
"r_x2": 175.42,
"r_y2": 444.43,
"r_x3": 119.59,
"r_y3": 444.43,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.42,
"r_y0": 453.46,
"r_x1": 286.36,
"r_y1": 453.46,
"r_x2": 286.36,
"r_y2": 444.55,
"r_x3": 175.42,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 465.41,
"r_x1": 286.36,
"r_y1": 465.41,
"r_x2": 286.36,
"r_y2": 456.51,
"r_x3": 70.04,
"r_y3": 456.51,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 477.37,
"r_x1": 286.36,
"r_y1": 477.37,
"r_x2": 286.36,
"r_y2": 468.46,
"r_x3": 70.04,
"r_y3": 468.46,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 489.32,
"r_x1": 99.64,
"r_y1": 489.32,
"r_x2": 99.64,
"r_y2": 480.42,
"r_x3": 70.04,
"r_y3": 480.42,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 502.03,
"r": 286.36,
"b": 546.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 511.06,
"r_x1": 71.62,
"r_y1": 511.06,
"r_x2": 71.62,
"r_y2": 502.15,
"r_x3": 61.57,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.13,
"r_y0": 511.06,
"r_x1": 196.1,
"r_y1": 511.06,
"r_x2": 196.1,
"r_y2": 502.15,
"r_x3": 74.13,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.31,
"r_y0": 510.99,
"r_x1": 256.14,
"r_y1": 510.99,
"r_x2": 256.14,
"r_y2": 502.03,
"r_x3": 200.31,
"r_y3": 502.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.35,
"r_y0": 511.06,
"r_x1": 286.36,
"r_y1": 511.06,
"r_x2": 286.36,
"r_y2": 502.15,
"r_x3": 260.35,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 523.01,
"r_x1": 286.36,
"r_y1": 523.01,
"r_x2": 286.36,
"r_y2": 514.11,
"r_x3": 70.04,
"r_y3": 514.11,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 534.97,
"r_x1": 286.36,
"r_y1": 534.97,
"r_x2": 286.36,
"r_y2": 526.06,
"r_x3": 70.04,
"r_y3": 526.06,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 546.93,
"r_x1": 161.65,
"r_y1": 546.93,
"r_x2": 161.65,
"r_y2": 538.02,
"r_x3": 70.04,
"r_y3": 538.02,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 559.64,
"r": 286.36,
"b": 592.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 568.66,
"r_x1": 71.12,
"r_y1": 568.66,
"r_x2": 71.12,
"r_y2": 559.76,
"r_x3": 61.57,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.66,
"r_x1": 116.71,
"r_y1": 568.66,
"r_x2": 116.71,
"r_y2": 559.76,
"r_x3": 73.5,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.58,
"r_y0": 568.59,
"r_x1": 177.68,
"r_y1": 568.59,
"r_x2": 177.68,
"r_y2": 559.64,
"r_x3": 121.58,
"r_y3": 559.64,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.55,
"r_y0": 568.66,
"r_x1": 286.36,
"r_y1": 568.66,
"r_x2": 286.36,
"r_y2": 559.76,
"r_x3": 182.55,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 580.62,
"r_x1": 286.36,
"r_y1": 580.62,
"r_x2": 286.36,
"r_y2": 571.71,
"r_x3": 70.04,
"r_y3": 571.71,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 592.57,
"r_x1": 82.4,
"r_y1": 592.57,
"r_x2": 82.4,
"r_y2": 583.67,
"r_x3": 70.04,
"r_y3": 583.67,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 605.4,
"r": 286.37,
"b": 638.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.981,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 614.31,
"r_x1": 72.33,
"r_y1": 614.31,
"r_x2": 72.33,
"r_y2": 605.4,
"r_x3": 61.57,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.02,
"r_y0": 614.31,
"r_x1": 286.37,
"r_y1": 614.31,
"r_x2": 286.37,
"r_y2": 605.4,
"r_x3": 75.02,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 626.26,
"r_x1": 286.36,
"r_y1": 626.26,
"r_x2": 286.36,
"r_y2": 617.36,
"r_x3": 70.04,
"r_y3": 617.36,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 638.22,
"r_x1": 198.06,
"r_y1": 638.22,
"r_x2": 198.06,
"r_y2": 629.31,
"r_x3": 70.04,
"r_y3": 629.31,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 650.6,
"r": 286.37,
"b": 695.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 659.5,
"r_x1": 286.36,
"r_y1": 659.5,
"r_x2": 286.36,
"r_y2": 650.6,
"r_x3": 62.07,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 671.46,
"r_x1": 286.37,
"r_y1": 671.46,
"r_x2": 286.37,
"r_y2": 662.55,
"r_x3": 50.11,
"r_y3": 662.55,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 683.41,
"r_x1": 286.37,
"r_y1": 683.41,
"r_x2": 286.37,
"r_y2": 674.51,
"r_x3": 50.11,
"r_y3": 674.51,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 695.37,
"r_x1": 286.37,
"r_y1": 695.37,
"r_x2": 286.37,
"r_y2": 686.46,
"r_x3": 50.11,
"r_y3": 686.46,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "footnote",
"bbox": {
"l": 60.97,
"t": 705.6,
"r": 183.73,
"b": 712.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.895,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.97,
"r_y0": 712.72,
"r_x1": 183.73,
"r_y1": 712.72,
"r_x2": 183.73,
"r_y2": 705.6,
"r_x3": 60.97,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 508.08,
"r_y1": 108.02,
"r_x2": 508.08,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 121.73,
"r": 498.28,
"b": 132.48,
"coord_origin": "TOPLEFT"
},
"confidence": 0.943,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 132.48,
"r_x1": 315.58,
"r_y1": 132.48,
"r_x2": 315.58,
"r_y2": 121.73,
"r_x3": 308.86,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.54,
"r_y0": 132.48,
"r_x1": 498.28,
"r_y1": 132.48,
"r_x2": 498.28,
"r_y2": 121.73,
"r_x3": 324.54,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 142.22,
"r": 545.12,
"b": 330.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 151.13,
"r_x1": 545.11,
"r_y1": 151.13,
"r_x2": 545.11,
"r_y2": 142.22,
"r_x3": 320.82,
"r_y3": 142.22,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 163.08,
"r_x1": 545.12,
"r_y1": 163.08,
"r_x2": 545.12,
"r_y2": 154.18,
"r_x3": 308.86,
"r_y3": 154.18,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 175.04,
"r_x1": 522.56,
"r_y1": 175.04,
"r_x2": 522.56,
"r_y2": 166.13,
"r_x3": 308.86,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 175.04,
"r_x1": 545.12,
"r_y1": 175.04,
"r_x2": 545.12,
"r_y2": 166.13,
"r_x3": 529.62,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 186.99,
"r_x1": 545.12,
"r_y1": 186.99,
"r_x2": 545.12,
"r_y2": 178.09,
"r_x3": 308.86,
"r_y3": 178.09,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 198.95,
"r_x1": 545.12,
"r_y1": 198.95,
"r_x2": 545.12,
"r_y2": 190.04,
"r_x3": 308.86,
"r_y3": 190.04,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 210.9,
"r_x1": 346.98,
"r_y1": 210.9,
"r_x2": 346.98,
"r_y2": 202.0,
"r_x3": 308.86,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.87,
"r_y0": 210.9,
"r_x1": 545.12,
"r_y1": 210.9,
"r_x2": 545.12,
"r_y2": 202.0,
"r_x3": 354.87,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 222.86,
"r_x1": 545.12,
"r_y1": 222.86,
"r_x2": 545.12,
"r_y2": 213.95,
"r_x3": 308.86,
"r_y3": 213.95,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 234.81,
"r_x1": 530.92,
"r_y1": 234.81,
"r_x2": 530.92,
"r_y2": 225.91,
"r_x3": 308.86,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.92,
"r_y0": 234.81,
"r_x1": 545.12,
"r_y1": 234.81,
"r_x2": 545.12,
"r_y2": 225.91,
"r_x3": 537.92,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 246.77,
"r_x1": 545.12,
"r_y1": 246.77,
"r_x2": 545.12,
"r_y2": 237.86,
"r_x3": 308.86,
"r_y3": 237.86,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.72,
"r_x1": 545.12,
"r_y1": 258.72,
"r_x2": 545.12,
"r_y2": 249.82,
"r_x3": 308.86,
"r_y3": 249.82,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.68,
"r_x1": 439.84,
"r_y1": 270.68,
"r_x2": 439.84,
"r_y2": 261.77,
"r_x3": 308.86,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.44,
"r_y0": 270.46,
"r_x1": 452.19,
"r_y1": 270.46,
"r_x2": 452.19,
"r_y2": 261.61,
"r_x3": 444.44,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.89,
"r_y0": 270.46,
"r_x1": 470.83,
"r_y1": 270.46,
"r_x2": 470.83,
"r_y2": 261.61,
"r_x3": 455.89,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.83,
"r_y0": 270.68,
"r_x1": 545.12,
"r_y1": 270.68,
"r_x2": 545.12,
"r_y2": 261.77,
"r_x3": 470.83,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.63,
"r_x1": 545.12,
"r_y1": 282.63,
"r_x2": 545.12,
"r_y2": 273.73,
"r_x3": 308.86,
"r_y3": 273.73,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.59,
"r_x1": 545.12,
"r_y1": 294.59,
"r_x2": 545.12,
"r_y2": 285.68,
"r_x3": 308.86,
"r_y3": 285.68,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 306.55,
"r_x1": 545.12,
"r_y1": 306.55,
"r_x2": 545.12,
"r_y2": 297.64,
"r_x3": 308.86,
"r_y3": 297.64,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 318.5,
"r_x1": 545.12,
"r_y1": 318.5,
"r_x2": 545.12,
"r_y2": 309.59,
"r_x3": 308.86,
"r_y3": 309.59,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 330.46,
"r_x1": 425.92,
"r_y1": 330.46,
"r_x2": 425.92,
"r_y2": 321.55,
"r_x3": 308.86,
"r_y3": 321.55,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 333.57,
"r": 545.12,
"b": 450.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 342.48,
"r_x1": 545.11,
"r_y1": 342.48,
"r_x2": 545.11,
"r_y2": 333.57,
"r_x3": 320.82,
"r_y3": 333.57,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 354.43,
"r_x1": 545.11,
"r_y1": 354.43,
"r_x2": 545.11,
"r_y2": 345.52,
"r_x3": 308.86,
"r_y3": 345.52,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 366.39,
"r_x1": 545.12,
"r_y1": 366.39,
"r_x2": 545.12,
"r_y2": 357.48,
"r_x3": 308.86,
"r_y3": 357.48,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 378.34,
"r_x1": 545.12,
"r_y1": 378.34,
"r_x2": 545.12,
"r_y2": 369.44,
"r_x3": 308.86,
"r_y3": 369.44,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 390.3,
"r_x1": 545.12,
"r_y1": 390.3,
"r_x2": 545.12,
"r_y2": 381.39,
"r_x3": 308.86,
"r_y3": 381.39,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 402.25,
"r_x1": 545.12,
"r_y1": 402.25,
"r_x2": 545.12,
"r_y2": 393.35,
"r_x3": 308.86,
"r_y3": 393.35,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 414.21,
"r_x1": 545.12,
"r_y1": 414.21,
"r_x2": 545.12,
"r_y2": 405.3,
"r_x3": 308.86,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 426.16,
"r_x1": 545.12,
"r_y1": 426.16,
"r_x2": 545.12,
"r_y2": 417.26,
"r_x3": 308.86,
"r_y3": 417.26,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 438.12,
"r_x1": 545.12,
"r_y1": 438.12,
"r_x2": 545.12,
"r_y2": 429.21,
"r_x3": 308.86,
"r_y3": 429.21,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 450.07,
"r_x1": 401.29,
"r_y1": 450.07,
"r_x2": 401.29,
"r_y2": 441.17,
"r_x3": 308.86,
"r_y3": 441.17,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 453.07,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 462.02,
"r_x1": 423.26,
"r_y1": 462.02,
"r_x2": 423.26,
"r_y2": 453.07,
"r_x3": 320.82,
"r_y3": 453.07,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.27,
"r_y0": 462.09,
"r_x1": 545.11,
"r_y1": 462.09,
"r_x2": 545.11,
"r_y2": 453.19,
"r_x3": 423.27,
"r_y3": 453.19,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 474.05,
"r_x1": 545.12,
"r_y1": 474.05,
"r_x2": 545.12,
"r_y2": 465.14,
"r_x3": 308.86,
"r_y3": 465.14,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.86,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.85,
"r_y0": 486.0,
"r_x1": 545.12,
"r_y1": 486.0,
"r_x2": 545.12,
"r_y2": 477.1,
"r_x3": 345.85,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.96,
"r_x1": 545.11,
"r_y1": 497.96,
"r_x2": 545.11,
"r_y2": 489.05,
"r_x3": 308.86,
"r_y3": 489.05,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.91,
"r_x1": 545.11,
"r_y1": 509.91,
"r_x2": 545.11,
"r_y2": 501.01,
"r_x3": 308.86,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.87,
"r_x1": 545.12,
"r_y1": 521.87,
"r_x2": 545.12,
"r_y2": 512.96,
"r_x3": 308.86,
"r_y3": 512.96,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.82,
"r_x1": 545.12,
"r_y1": 533.82,
"r_x2": 545.12,
"r_y2": 524.92,
"r_x3": 308.86,
"r_y3": 524.92,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.78,
"r_x1": 420.94,
"r_y1": 545.78,
"r_x2": 420.94,
"r_y2": 536.87,
"r_x3": 308.86,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.59,
"r_y0": 545.56,
"r_x1": 433.56,
"r_y1": 545.56,
"r_x2": 433.56,
"r_y2": 536.16,
"r_x3": 423.59,
"r_y3": 536.16,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.21,
"r_y0": 545.78,
"r_x1": 545.11,
"r_y1": 545.78,
"r_x2": 545.11,
"r_y2": 536.87,
"r_x3": 436.21,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.73,
"r_x1": 545.12,
"r_y1": 557.73,
"r_x2": 545.12,
"r_y2": 548.83,
"r_x3": 308.86,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.69,
"r_x1": 545.11,
"r_y1": 569.69,
"r_x2": 545.11,
"r_y2": 560.78,
"r_x3": 308.86,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.64,
"r_x1": 545.11,
"r_y1": 581.64,
"r_x2": 545.11,
"r_y2": 572.74,
"r_x3": 308.86,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.6,
"r_x1": 545.12,
"r_y1": 593.6,
"r_x2": 545.12,
"r_y2": 584.69,
"r_x3": 308.86,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.56,
"r_x1": 497.08,
"r_y1": 605.56,
"r_x2": 497.08,
"r_y2": 596.65,
"r_x3": 308.86,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.34,
"r_x1": 509.77,
"r_y1": 605.34,
"r_x2": 509.77,
"r_y2": 595.93,
"r_x3": 499.8,
"r_y3": 595.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.56,
"r_x1": 545.11,
"r_y1": 605.56,
"r_x2": 545.11,
"r_y2": 596.65,
"r_x3": 512.5,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.51,
"r_x1": 545.12,
"r_y1": 617.51,
"r_x2": 545.12,
"r_y2": 608.6,
"r_x3": 308.86,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.47,
"r_x1": 545.12,
"r_y1": 629.47,
"r_x2": 545.12,
"r_y2": 620.56,
"r_x3": 308.86,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.42,
"r_x1": 364.78,
"r_y1": 641.42,
"r_x2": 364.78,
"r_y2": 632.51,
"r_x3": 308.86,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.57,
"r_y0": 641.19,
"r_x1": 415.61,
"r_y1": 641.19,
"r_x2": 415.61,
"r_y2": 632.6,
"r_x3": 367.57,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.61,
"r_y0": 641.42,
"r_x1": 545.12,
"r_y1": 641.42,
"r_x2": 545.12,
"r_y2": 632.51,
"r_x3": 415.61,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.51,
"r_x3": 308.86,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.91,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.43,
"r_x3": 376.91,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.12,
"r_y1": 677.29,
"r_x2": 545.12,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.01,
"r_x1": 356.9,
"r_y1": 689.01,
"r_x2": 356.9,
"r_y2": 680.42,
"r_x3": 308.86,
"r_y3": 680.42,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.13,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 357.13,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 12,
"page_no": 1,
"cluster": {
"id": 12,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 112.65,
"r_y1": 96.07,
"r_x2": 112.65,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "considered as a solved problem, given enough ground-truth data to train on."
},
{
"label": "text",
"id": 4,
"page_no": 1,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 99.57,
"r": 286.37,
"b": 228.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 108.48,
"r_x1": 286.36,
"r_y1": 108.48,
"r_x2": 286.36,
"r_y2": 99.57,
"r_x3": 62.07,
"r_y3": 99.57,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.43,
"r_x1": 74.75,
"r_y1": 120.43,
"r_x2": 74.75,
"r_y2": 111.53,
"r_x3": 50.11,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.33,
"r_y0": 120.43,
"r_x1": 286.37,
"r_y1": 120.43,
"r_x2": 286.37,
"r_y2": 111.53,
"r_x3": 81.33,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 132.39,
"r_x1": 286.37,
"r_y1": 132.39,
"r_x2": 286.37,
"r_y2": 123.48,
"r_x3": 50.11,
"r_y3": 123.48,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 144.34,
"r_x1": 286.37,
"r_y1": 144.34,
"r_x2": 286.37,
"r_y2": 135.44,
"r_x3": 50.11,
"r_y3": 135.44,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 156.3,
"r_x1": 286.37,
"r_y1": 156.3,
"r_x2": 286.37,
"r_y2": 147.39,
"r_x3": 50.11,
"r_y3": 147.39,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 168.25,
"r_x1": 286.37,
"r_y1": 168.25,
"r_x2": 286.37,
"r_y2": 159.35,
"r_x3": 50.11,
"r_y3": 159.35,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.21,
"r_x1": 286.37,
"r_y1": 180.21,
"r_x2": 286.37,
"r_y2": 171.3,
"r_x3": 50.11,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.16,
"r_x1": 286.37,
"r_y1": 192.16,
"r_x2": 286.37,
"r_y2": 183.26,
"r_x3": 50.11,
"r_y3": 183.26,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.12,
"r_x1": 286.37,
"r_y1": 204.12,
"r_x2": 286.37,
"r_y2": 195.21,
"r_x3": 50.11,
"r_y3": 195.21,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.07,
"r_x1": 286.37,
"r_y1": 216.07,
"r_x2": 286.37,
"r_y2": 207.17,
"r_x3": 50.11,
"r_y3": 207.17,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.03,
"r_x1": 278.66,
"r_y1": 228.03,
"r_x2": 278.66,
"r_y2": 219.12,
"r_x3": 50.11,
"r_y3": 219.12,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."
},
{
"label": "text",
"id": 2,
"page_no": 1,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 231.53,
"r": 286.37,
"b": 371.95,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 240.44,
"r_x1": 286.36,
"r_y1": 240.44,
"r_x2": 286.36,
"r_y2": 231.53,
"r_x3": 62.07,
"r_y3": 231.53,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 252.39,
"r_x1": 286.37,
"r_y1": 252.39,
"r_x2": 286.37,
"r_y2": 243.49,
"r_x3": 50.11,
"r_y3": 243.49,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.35,
"r_x1": 286.37,
"r_y1": 264.35,
"r_x2": 286.37,
"r_y2": 255.44,
"r_x3": 50.11,
"r_y3": 255.44,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.3,
"r_x1": 286.37,
"r_y1": 276.3,
"r_x2": 286.37,
"r_y2": 267.4,
"r_x3": 50.11,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.26,
"r_x1": 286.37,
"r_y1": 288.26,
"r_x2": 286.37,
"r_y2": 279.35,
"r_x3": 50.11,
"r_y3": 279.35,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.21,
"r_x1": 88.57,
"r_y1": 300.21,
"r_x2": 88.57,
"r_y2": 291.31,
"r_x3": 50.11,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.21,
"r_x1": 286.37,
"r_y1": 300.21,
"r_x2": 286.37,
"r_y2": 291.31,
"r_x3": 95.5,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.17,
"r_x1": 286.37,
"r_y1": 312.17,
"r_x2": 286.37,
"r_y2": 303.26,
"r_x3": 50.11,
"r_y3": 303.26,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.12,
"r_x1": 286.37,
"r_y1": 324.12,
"r_x2": 286.37,
"r_y2": 315.22,
"r_x3": 50.11,
"r_y3": 315.22,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.08,
"r_x1": 286.37,
"r_y1": 336.08,
"r_x2": 286.37,
"r_y2": 327.17,
"r_x3": 50.11,
"r_y3": 327.17,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.03,
"r_x1": 286.37,
"r_y1": 348.03,
"r_x2": 286.37,
"r_y2": 339.13,
"r_x3": 50.11,
"r_y3": 339.13,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.99,
"r_x1": 286.37,
"r_y1": 359.99,
"r_x2": 286.37,
"r_y2": 351.08,
"r_x3": 50.11,
"r_y3": 351.08,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.95,
"r_x1": 76.95,
"r_y1": 371.95,
"r_x2": 76.95,
"r_y2": 363.04,
"r_x3": 50.11,
"r_y3": 363.04,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."
},
{
"label": "text",
"id": 7,
"page_no": 1,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 375.45,
"r": 286.37,
"b": 432.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 384.35,
"r_x1": 286.36,
"r_y1": 384.35,
"r_x2": 286.36,
"r_y2": 375.45,
"r_x3": 62.07,
"r_y3": 375.45,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.31,
"r_x1": 120.99,
"r_y1": 396.31,
"r_x2": 120.99,
"r_y2": 387.4,
"r_x3": 50.11,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.24,
"r_x1": 179.73,
"r_y1": 396.24,
"r_x2": 179.73,
"r_y2": 387.28,
"r_x3": 123.9,
"r_y3": 387.28,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.65,
"r_y0": 396.31,
"r_x1": 286.37,
"r_y1": 396.31,
"r_x2": 286.37,
"r_y2": 387.4,
"r_x3": 182.65,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.26,
"r_x1": 181.76,
"r_y1": 408.26,
"r_x2": 181.76,
"r_y2": 399.36,
"r_x3": 50.11,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.19,
"r_x1": 240.2,
"r_y1": 408.19,
"r_x2": 240.2,
"r_y2": 399.24,
"r_x3": 184.1,
"r_y3": 399.24,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.26,
"r_x1": 286.36,
"r_y1": 408.26,
"r_x2": 286.36,
"r_y2": 399.36,
"r_x3": 240.2,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.22,
"r_x1": 286.37,
"r_y1": 420.22,
"r_x2": 286.37,
"r_y2": 411.31,
"r_x3": 50.11,
"r_y3": 411.31,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.17,
"r_x1": 82.52,
"r_y1": 432.17,
"r_x2": 82.52,
"r_y2": 423.27,
"r_x3": 50.11,
"r_y3": 423.27,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:"
},
{
"label": "list_item",
"id": 6,
"page_no": 1,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 444.43,
"r": 286.36,
"b": 489.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 453.46,
"r_x1": 70.74,
"r_y1": 453.46,
"r_x2": 70.74,
"r_y2": 444.55,
"r_x3": 61.57,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.03,
"r_y0": 453.46,
"r_x1": 117.1,
"r_y1": 453.46,
"r_x2": 117.1,
"r_y2": 444.55,
"r_x3": 73.03,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.59,
"r_y0": 453.39,
"r_x1": 175.42,
"r_y1": 453.39,
"r_x2": 175.42,
"r_y2": 444.43,
"r_x3": 119.59,
"r_y3": 444.43,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.42,
"r_y0": 453.46,
"r_x1": 286.36,
"r_y1": 453.46,
"r_x2": 286.36,
"r_y2": 444.55,
"r_x3": 175.42,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 465.41,
"r_x1": 286.36,
"r_y1": 465.41,
"r_x2": 286.36,
"r_y2": 456.51,
"r_x3": 70.04,
"r_y3": 456.51,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 477.37,
"r_x1": 286.36,
"r_y1": 477.37,
"r_x2": 286.36,
"r_y2": 468.46,
"r_x3": 70.04,
"r_y3": 468.46,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 489.32,
"r_x1": 99.64,
"r_y1": 489.32,
"r_x2": 99.64,
"r_y2": 480.42,
"r_x3": 70.04,
"r_y3": 480.42,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."
},
{
"label": "list_item",
"id": 5,
"page_no": 1,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 502.03,
"r": 286.36,
"b": 546.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 511.06,
"r_x1": 71.62,
"r_y1": 511.06,
"r_x2": 71.62,
"r_y2": 502.15,
"r_x3": 61.57,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.13,
"r_y0": 511.06,
"r_x1": 196.1,
"r_y1": 511.06,
"r_x2": 196.1,
"r_y2": 502.15,
"r_x3": 74.13,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.31,
"r_y0": 510.99,
"r_x1": 256.14,
"r_y1": 510.99,
"r_x2": 256.14,
"r_y2": 502.03,
"r_x3": 200.31,
"r_y3": 502.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.35,
"r_y0": 511.06,
"r_x1": 286.36,
"r_y1": 511.06,
"r_x2": 286.36,
"r_y2": 502.15,
"r_x3": 260.35,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 523.01,
"r_x1": 286.36,
"r_y1": 523.01,
"r_x2": 286.36,
"r_y2": 514.11,
"r_x3": 70.04,
"r_y3": 514.11,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 534.97,
"r_x1": 286.36,
"r_y1": 534.97,
"r_x2": 286.36,
"r_y2": 526.06,
"r_x3": 70.04,
"r_y3": 526.06,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 546.93,
"r_x1": 161.65,
"r_y1": 546.93,
"r_x2": 161.65,
"r_y2": 538.02,
"r_x3": 70.04,
"r_y3": 538.02,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."
},
{
"label": "list_item",
"id": 9,
"page_no": 1,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 559.64,
"r": 286.36,
"b": 592.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 568.66,
"r_x1": 71.12,
"r_y1": 568.66,
"r_x2": 71.12,
"r_y2": 559.76,
"r_x3": 61.57,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.66,
"r_x1": 116.71,
"r_y1": 568.66,
"r_x2": 116.71,
"r_y2": 559.76,
"r_x3": 73.5,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.58,
"r_y0": 568.59,
"r_x1": 177.68,
"r_y1": 568.59,
"r_x2": 177.68,
"r_y2": 559.64,
"r_x3": 121.58,
"r_y3": 559.64,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.55,
"r_y0": 568.66,
"r_x1": 286.36,
"r_y1": 568.66,
"r_x2": 286.36,
"r_y2": 559.76,
"r_x3": 182.55,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 580.62,
"r_x1": 286.36,
"r_y1": 580.62,
"r_x2": 286.36,
"r_y2": 571.71,
"r_x3": 70.04,
"r_y3": 571.71,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 592.57,
"r_x1": 82.4,
"r_y1": 592.57,
"r_x2": 82.4,
"r_y2": 583.67,
"r_x3": 70.04,
"r_y3": 583.67,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."
},
{
"label": "list_item",
"id": 8,
"page_no": 1,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 605.4,
"r": 286.37,
"b": 638.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.981,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 614.31,
"r_x1": 72.33,
"r_y1": 614.31,
"r_x2": 72.33,
"r_y2": 605.4,
"r_x3": 61.57,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.02,
"r_y0": 614.31,
"r_x1": 286.37,
"r_y1": 614.31,
"r_x2": 286.37,
"r_y2": 605.4,
"r_x3": 75.02,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 626.26,
"r_x1": 286.36,
"r_y1": 626.26,
"r_x2": 286.36,
"r_y2": 617.36,
"r_x3": 70.04,
"r_y3": 617.36,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 638.22,
"r_x1": 198.06,
"r_y1": 638.22,
"r_x2": 198.06,
"r_y2": 629.31,
"r_x3": 70.04,
"r_y3": 629.31,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."
},
{
"label": "text",
"id": 11,
"page_no": 1,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 650.6,
"r": 286.37,
"b": 695.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 659.5,
"r_x1": 286.36,
"r_y1": 659.5,
"r_x2": 286.36,
"r_y2": 650.6,
"r_x3": 62.07,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 671.46,
"r_x1": 286.37,
"r_y1": 671.46,
"r_x2": 286.37,
"r_y2": 662.55,
"r_x3": 50.11,
"r_y3": 662.55,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 683.41,
"r_x1": 286.37,
"r_y1": 683.41,
"r_x2": 286.37,
"r_y2": 674.51,
"r_x3": 50.11,
"r_y3": 674.51,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 695.37,
"r_x1": 286.37,
"r_y1": 695.37,
"r_x2": 286.37,
"r_y2": 686.46,
"r_x3": 50.11,
"r_y3": 686.46,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"
},
{
"label": "footnote",
"id": 14,
"page_no": 1,
"cluster": {
"id": 14,
"label": "footnote",
"bbox": {
"l": 60.97,
"t": 705.6,
"r": 183.73,
"b": 712.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.895,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.97,
"r_y0": 712.72,
"r_x1": 183.73,
"r_y1": 712.72,
"r_x2": 183.73,
"r_y2": 705.6,
"r_x3": 60.97,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet"
},
{
"label": "text",
"id": 10,
"page_no": 1,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 508.08,
"r_y1": 108.02,
"r_x2": 508.08,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."
},
{
"label": "section_header",
"id": 13,
"page_no": 1,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 121.73,
"r": 498.28,
"b": 132.48,
"coord_origin": "TOPLEFT"
},
"confidence": 0.943,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 132.48,
"r_x1": 315.58,
"r_y1": 132.48,
"r_x2": 315.58,
"r_y2": 121.73,
"r_x3": 308.86,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.54,
"r_y0": 132.48,
"r_x1": 498.28,
"r_y1": 132.48,
"r_x2": 498.28,
"r_y2": 121.73,
"r_x3": 324.54,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Previous work and State of the Art"
},
{
"label": "text",
"id": 0,
"page_no": 1,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 142.22,
"r": 545.12,
"b": 330.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 151.13,
"r_x1": 545.11,
"r_y1": 151.13,
"r_x2": 545.11,
"r_y2": 142.22,
"r_x3": 320.82,
"r_y3": 142.22,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 163.08,
"r_x1": 545.12,
"r_y1": 163.08,
"r_x2": 545.12,
"r_y2": 154.18,
"r_x3": 308.86,
"r_y3": 154.18,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 175.04,
"r_x1": 522.56,
"r_y1": 175.04,
"r_x2": 522.56,
"r_y2": 166.13,
"r_x3": 308.86,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 175.04,
"r_x1": 545.12,
"r_y1": 175.04,
"r_x2": 545.12,
"r_y2": 166.13,
"r_x3": 529.62,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 186.99,
"r_x1": 545.12,
"r_y1": 186.99,
"r_x2": 545.12,
"r_y2": 178.09,
"r_x3": 308.86,
"r_y3": 178.09,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 198.95,
"r_x1": 545.12,
"r_y1": 198.95,
"r_x2": 545.12,
"r_y2": 190.04,
"r_x3": 308.86,
"r_y3": 190.04,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 210.9,
"r_x1": 346.98,
"r_y1": 210.9,
"r_x2": 346.98,
"r_y2": 202.0,
"r_x3": 308.86,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.87,
"r_y0": 210.9,
"r_x1": 545.12,
"r_y1": 210.9,
"r_x2": 545.12,
"r_y2": 202.0,
"r_x3": 354.87,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 222.86,
"r_x1": 545.12,
"r_y1": 222.86,
"r_x2": 545.12,
"r_y2": 213.95,
"r_x3": 308.86,
"r_y3": 213.95,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 234.81,
"r_x1": 530.92,
"r_y1": 234.81,
"r_x2": 530.92,
"r_y2": 225.91,
"r_x3": 308.86,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.92,
"r_y0": 234.81,
"r_x1": 545.12,
"r_y1": 234.81,
"r_x2": 545.12,
"r_y2": 225.91,
"r_x3": 537.92,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 246.77,
"r_x1": 545.12,
"r_y1": 246.77,
"r_x2": 545.12,
"r_y2": 237.86,
"r_x3": 308.86,
"r_y3": 237.86,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.72,
"r_x1": 545.12,
"r_y1": 258.72,
"r_x2": 545.12,
"r_y2": 249.82,
"r_x3": 308.86,
"r_y3": 249.82,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.68,
"r_x1": 439.84,
"r_y1": 270.68,
"r_x2": 439.84,
"r_y2": 261.77,
"r_x3": 308.86,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.44,
"r_y0": 270.46,
"r_x1": 452.19,
"r_y1": 270.46,
"r_x2": 452.19,
"r_y2": 261.61,
"r_x3": 444.44,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.89,
"r_y0": 270.46,
"r_x1": 470.83,
"r_y1": 270.46,
"r_x2": 470.83,
"r_y2": 261.61,
"r_x3": 455.89,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.83,
"r_y0": 270.68,
"r_x1": 545.12,
"r_y1": 270.68,
"r_x2": 545.12,
"r_y2": 261.77,
"r_x3": 470.83,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.63,
"r_x1": 545.12,
"r_y1": 282.63,
"r_x2": 545.12,
"r_y2": 273.73,
"r_x3": 308.86,
"r_y3": 273.73,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.59,
"r_x1": 545.12,
"r_y1": 294.59,
"r_x2": 545.12,
"r_y2": 285.68,
"r_x3": 308.86,
"r_y3": 285.68,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 306.55,
"r_x1": 545.12,
"r_y1": 306.55,
"r_x2": 545.12,
"r_y2": 297.64,
"r_x3": 308.86,
"r_y3": 297.64,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 318.5,
"r_x1": 545.12,
"r_y1": 318.5,
"r_x2": 545.12,
"r_y2": 309.59,
"r_x3": 308.86,
"r_y3": 309.59,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 330.46,
"r_x1": 425.92,
"r_y1": 330.46,
"r_x2": 425.92,
"r_y2": 321.55,
"r_x3": 308.86,
"r_y3": 321.55,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."
},
{
"label": "text",
"id": 1,
"page_no": 1,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 333.57,
"r": 545.12,
"b": 450.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 342.48,
"r_x1": 545.11,
"r_y1": 342.48,
"r_x2": 545.11,
"r_y2": 333.57,
"r_x3": 320.82,
"r_y3": 333.57,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 354.43,
"r_x1": 545.11,
"r_y1": 354.43,
"r_x2": 545.11,
"r_y2": 345.52,
"r_x3": 308.86,
"r_y3": 345.52,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 366.39,
"r_x1": 545.12,
"r_y1": 366.39,
"r_x2": 545.12,
"r_y2": 357.48,
"r_x3": 308.86,
"r_y3": 357.48,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 378.34,
"r_x1": 545.12,
"r_y1": 378.34,
"r_x2": 545.12,
"r_y2": 369.44,
"r_x3": 308.86,
"r_y3": 369.44,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 390.3,
"r_x1": 545.12,
"r_y1": 390.3,
"r_x2": 545.12,
"r_y2": 381.39,
"r_x3": 308.86,
"r_y3": 381.39,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 402.25,
"r_x1": 545.12,
"r_y1": 402.25,
"r_x2": 545.12,
"r_y2": 393.35,
"r_x3": 308.86,
"r_y3": 393.35,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 414.21,
"r_x1": 545.12,
"r_y1": 414.21,
"r_x2": 545.12,
"r_y2": 405.3,
"r_x3": 308.86,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 426.16,
"r_x1": 545.12,
"r_y1": 426.16,
"r_x2": 545.12,
"r_y2": 417.26,
"r_x3": 308.86,
"r_y3": 417.26,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 438.12,
"r_x1": 545.12,
"r_y1": 438.12,
"r_x2": 545.12,
"r_y2": 429.21,
"r_x3": 308.86,
"r_y3": 429.21,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 450.07,
"r_x1": 401.29,
"r_y1": 450.07,
"r_x2": 401.29,
"r_y2": 441.17,
"r_x3": 308.86,
"r_y3": 441.17,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art table-structure identification."
},
{
"label": "text",
"id": 3,
"page_no": 1,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 453.07,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 462.02,
"r_x1": 423.26,
"r_y1": 462.02,
"r_x2": 423.26,
"r_y2": 453.07,
"r_x3": 320.82,
"r_y3": 453.07,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.27,
"r_y0": 462.09,
"r_x1": 545.11,
"r_y1": 462.09,
"r_x2": 545.11,
"r_y2": 453.19,
"r_x3": 423.27,
"r_y3": 453.19,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 474.05,
"r_x1": 545.12,
"r_y1": 474.05,
"r_x2": 545.12,
"r_y2": 465.14,
"r_x3": 308.86,
"r_y3": 465.14,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.86,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.85,
"r_y0": 486.0,
"r_x1": 545.12,
"r_y1": 486.0,
"r_x2": 545.12,
"r_y2": 477.1,
"r_x3": 345.85,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.96,
"r_x1": 545.11,
"r_y1": 497.96,
"r_x2": 545.11,
"r_y2": 489.05,
"r_x3": 308.86,
"r_y3": 489.05,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.91,
"r_x1": 545.11,
"r_y1": 509.91,
"r_x2": 545.11,
"r_y2": 501.01,
"r_x3": 308.86,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.87,
"r_x1": 545.12,
"r_y1": 521.87,
"r_x2": 545.12,
"r_y2": 512.96,
"r_x3": 308.86,
"r_y3": 512.96,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.82,
"r_x1": 545.12,
"r_y1": 533.82,
"r_x2": 545.12,
"r_y2": 524.92,
"r_x3": 308.86,
"r_y3": 524.92,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.78,
"r_x1": 420.94,
"r_y1": 545.78,
"r_x2": 420.94,
"r_y2": 536.87,
"r_x3": 308.86,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.59,
"r_y0": 545.56,
"r_x1": 433.56,
"r_y1": 545.56,
"r_x2": 433.56,
"r_y2": 536.16,
"r_x3": 423.59,
"r_y3": 536.16,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.21,
"r_y0": 545.78,
"r_x1": 545.11,
"r_y1": 545.78,
"r_x2": 545.11,
"r_y2": 536.87,
"r_x3": 436.21,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.73,
"r_x1": 545.12,
"r_y1": 557.73,
"r_x2": 545.12,
"r_y2": 548.83,
"r_x3": 308.86,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.69,
"r_x1": 545.11,
"r_y1": 569.69,
"r_x2": 545.11,
"r_y2": 560.78,
"r_x3": 308.86,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.64,
"r_x1": 545.11,
"r_y1": 581.64,
"r_x2": 545.11,
"r_y2": 572.74,
"r_x3": 308.86,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.6,
"r_x1": 545.12,
"r_y1": 593.6,
"r_x2": 545.12,
"r_y2": 584.69,
"r_x3": 308.86,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.56,
"r_x1": 497.08,
"r_y1": 605.56,
"r_x2": 497.08,
"r_y2": 596.65,
"r_x3": 308.86,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.34,
"r_x1": 509.77,
"r_y1": 605.34,
"r_x2": 509.77,
"r_y2": 595.93,
"r_x3": 499.8,
"r_y3": 595.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.56,
"r_x1": 545.11,
"r_y1": 605.56,
"r_x2": 545.11,
"r_y2": 596.65,
"r_x3": 512.5,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.51,
"r_x1": 545.12,
"r_y1": 617.51,
"r_x2": 545.12,
"r_y2": 608.6,
"r_x3": 308.86,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.47,
"r_x1": 545.12,
"r_y1": 629.47,
"r_x2": 545.12,
"r_y2": 620.56,
"r_x3": 308.86,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.42,
"r_x1": 364.78,
"r_y1": 641.42,
"r_x2": 364.78,
"r_y2": 632.51,
"r_x3": 308.86,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.57,
"r_y0": 641.19,
"r_x1": 415.61,
"r_y1": 641.19,
"r_x2": 415.61,
"r_y2": 632.6,
"r_x3": 367.57,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.61,
"r_y0": 641.42,
"r_x1": 545.12,
"r_y1": 641.42,
"r_x2": 545.12,
"r_y2": 632.51,
"r_x3": 415.61,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.51,
"r_x3": 308.86,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.91,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.43,
"r_x3": 376.91,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.12,
"r_y1": 677.29,
"r_x2": 545.12,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.01,
"r_x1": 356.9,
"r_y1": 689.01,
"r_x2": 356.9,
"r_y2": 680.42,
"r_x3": 308.86,
"r_y3": 680.42,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.13,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 357.13,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"
},
{
"label": "page_footer",
"id": 15,
"page_no": 1,
"cluster": {
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2"
}
],
"body": [
{
"label": "text",
"id": 12,
"page_no": 1,
"cluster": {
"id": 12,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 112.65,
"r_y1": 96.07,
"r_x2": 112.65,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "considered as a solved problem, given enough ground-truth data to train on."
},
{
"label": "text",
"id": 4,
"page_no": 1,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 99.57,
"r": 286.37,
"b": 228.03,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 108.48,
"r_x1": 286.36,
"r_y1": 108.48,
"r_x2": 286.36,
"r_y2": 99.57,
"r_x3": 62.07,
"r_y3": 99.57,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.43,
"r_x1": 74.75,
"r_y1": 120.43,
"r_x2": 74.75,
"r_y2": 111.53,
"r_x3": 50.11,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.33,
"r_y0": 120.43,
"r_x1": 286.37,
"r_y1": 120.43,
"r_x2": 286.37,
"r_y2": 111.53,
"r_x3": 81.33,
"r_y3": 111.53,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 132.39,
"r_x1": 286.37,
"r_y1": 132.39,
"r_x2": 286.37,
"r_y2": 123.48,
"r_x3": 50.11,
"r_y3": 123.48,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 144.34,
"r_x1": 286.37,
"r_y1": 144.34,
"r_x2": 286.37,
"r_y2": 135.44,
"r_x3": 50.11,
"r_y3": 135.44,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 156.3,
"r_x1": 286.37,
"r_y1": 156.3,
"r_x2": 286.37,
"r_y2": 147.39,
"r_x3": 50.11,
"r_y3": 147.39,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 168.25,
"r_x1": 286.37,
"r_y1": 168.25,
"r_x2": 286.37,
"r_y2": 159.35,
"r_x3": 50.11,
"r_y3": 159.35,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.21,
"r_x1": 286.37,
"r_y1": 180.21,
"r_x2": 286.37,
"r_y2": 171.3,
"r_x3": 50.11,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.16,
"r_x1": 286.37,
"r_y1": 192.16,
"r_x2": 286.37,
"r_y2": 183.26,
"r_x3": 50.11,
"r_y3": 183.26,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.12,
"r_x1": 286.37,
"r_y1": 204.12,
"r_x2": 286.37,
"r_y2": 195.21,
"r_x3": 50.11,
"r_y3": 195.21,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.07,
"r_x1": 286.37,
"r_y1": 216.07,
"r_x2": 286.37,
"r_y2": 207.17,
"r_x3": 50.11,
"r_y3": 207.17,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.03,
"r_x1": 278.66,
"r_y1": 228.03,
"r_x2": 278.66,
"r_y2": 219.12,
"r_x3": 50.11,
"r_y3": 219.12,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."
},
{
"label": "text",
"id": 2,
"page_no": 1,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 231.53,
"r": 286.37,
"b": 371.95,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 240.44,
"r_x1": 286.36,
"r_y1": 240.44,
"r_x2": 286.36,
"r_y2": 231.53,
"r_x3": 62.07,
"r_y3": 231.53,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 252.39,
"r_x1": 286.37,
"r_y1": 252.39,
"r_x2": 286.37,
"r_y2": 243.49,
"r_x3": 50.11,
"r_y3": 243.49,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.35,
"r_x1": 286.37,
"r_y1": 264.35,
"r_x2": 286.37,
"r_y2": 255.44,
"r_x3": 50.11,
"r_y3": 255.44,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.3,
"r_x1": 286.37,
"r_y1": 276.3,
"r_x2": 286.37,
"r_y2": 267.4,
"r_x3": 50.11,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.26,
"r_x1": 286.37,
"r_y1": 288.26,
"r_x2": 286.37,
"r_y2": 279.35,
"r_x3": 50.11,
"r_y3": 279.35,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.21,
"r_x1": 88.57,
"r_y1": 300.21,
"r_x2": 88.57,
"r_y2": 291.31,
"r_x3": 50.11,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.21,
"r_x1": 286.37,
"r_y1": 300.21,
"r_x2": 286.37,
"r_y2": 291.31,
"r_x3": 95.5,
"r_y3": 291.31,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.17,
"r_x1": 286.37,
"r_y1": 312.17,
"r_x2": 286.37,
"r_y2": 303.26,
"r_x3": 50.11,
"r_y3": 303.26,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.12,
"r_x1": 286.37,
"r_y1": 324.12,
"r_x2": 286.37,
"r_y2": 315.22,
"r_x3": 50.11,
"r_y3": 315.22,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.08,
"r_x1": 286.37,
"r_y1": 336.08,
"r_x2": 286.37,
"r_y2": 327.17,
"r_x3": 50.11,
"r_y3": 327.17,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.03,
"r_x1": 286.37,
"r_y1": 348.03,
"r_x2": 286.37,
"r_y2": 339.13,
"r_x3": 50.11,
"r_y3": 339.13,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.99,
"r_x1": 286.37,
"r_y1": 359.99,
"r_x2": 286.37,
"r_y2": 351.08,
"r_x3": 50.11,
"r_y3": 351.08,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.95,
"r_x1": 76.95,
"r_y1": 371.95,
"r_x2": 76.95,
"r_y2": 363.04,
"r_x3": 50.11,
"r_y3": 363.04,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."
},
{
"label": "text",
"id": 7,
"page_no": 1,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 375.45,
"r": 286.37,
"b": 432.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 384.35,
"r_x1": 286.36,
"r_y1": 384.35,
"r_x2": 286.36,
"r_y2": 375.45,
"r_x3": 62.07,
"r_y3": 375.45,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.31,
"r_x1": 120.99,
"r_y1": 396.31,
"r_x2": 120.99,
"r_y2": 387.4,
"r_x3": 50.11,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.24,
"r_x1": 179.73,
"r_y1": 396.24,
"r_x2": 179.73,
"r_y2": 387.28,
"r_x3": 123.9,
"r_y3": 387.28,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.65,
"r_y0": 396.31,
"r_x1": 286.37,
"r_y1": 396.31,
"r_x2": 286.37,
"r_y2": 387.4,
"r_x3": 182.65,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.26,
"r_x1": 181.76,
"r_y1": 408.26,
"r_x2": 181.76,
"r_y2": 399.36,
"r_x3": 50.11,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.19,
"r_x1": 240.2,
"r_y1": 408.19,
"r_x2": 240.2,
"r_y2": 399.24,
"r_x3": 184.1,
"r_y3": 399.24,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.26,
"r_x1": 286.36,
"r_y1": 408.26,
"r_x2": 286.36,
"r_y2": 399.36,
"r_x3": 240.2,
"r_y3": 399.36,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.22,
"r_x1": 286.37,
"r_y1": 420.22,
"r_x2": 286.37,
"r_y2": 411.31,
"r_x3": 50.11,
"r_y3": 411.31,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.17,
"r_x1": 82.52,
"r_y1": 432.17,
"r_x2": 82.52,
"r_y2": 423.27,
"r_x3": 50.11,
"r_y3": 423.27,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:"
},
{
"label": "list_item",
"id": 6,
"page_no": 1,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 444.43,
"r": 286.36,
"b": 489.32,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 453.46,
"r_x1": 70.74,
"r_y1": 453.46,
"r_x2": 70.74,
"r_y2": 444.55,
"r_x3": 61.57,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.03,
"r_y0": 453.46,
"r_x1": 117.1,
"r_y1": 453.46,
"r_x2": 117.1,
"r_y2": 444.55,
"r_x3": 73.03,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.59,
"r_y0": 453.39,
"r_x1": 175.42,
"r_y1": 453.39,
"r_x2": 175.42,
"r_y2": 444.43,
"r_x3": 119.59,
"r_y3": 444.43,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.42,
"r_y0": 453.46,
"r_x1": 286.36,
"r_y1": 453.46,
"r_x2": 286.36,
"r_y2": 444.55,
"r_x3": 175.42,
"r_y3": 444.55,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 465.41,
"r_x1": 286.36,
"r_y1": 465.41,
"r_x2": 286.36,
"r_y2": 456.51,
"r_x3": 70.04,
"r_y3": 456.51,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 477.37,
"r_x1": 286.36,
"r_y1": 477.37,
"r_x2": 286.36,
"r_y2": 468.46,
"r_x3": 70.04,
"r_y3": 468.46,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 489.32,
"r_x1": 99.64,
"r_y1": 489.32,
"r_x2": 99.64,
"r_y2": 480.42,
"r_x3": 70.04,
"r_y3": 480.42,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."
},
{
"label": "list_item",
"id": 5,
"page_no": 1,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 502.03,
"r": 286.36,
"b": 546.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 511.06,
"r_x1": 71.62,
"r_y1": 511.06,
"r_x2": 71.62,
"r_y2": 502.15,
"r_x3": 61.57,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.13,
"r_y0": 511.06,
"r_x1": 196.1,
"r_y1": 511.06,
"r_x2": 196.1,
"r_y2": 502.15,
"r_x3": 74.13,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.31,
"r_y0": 510.99,
"r_x1": 256.14,
"r_y1": 510.99,
"r_x2": 256.14,
"r_y2": 502.03,
"r_x3": 200.31,
"r_y3": 502.03,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.35,
"r_y0": 511.06,
"r_x1": 286.36,
"r_y1": 511.06,
"r_x2": 286.36,
"r_y2": 502.15,
"r_x3": 260.35,
"r_y3": 502.15,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 523.01,
"r_x1": 286.36,
"r_y1": 523.01,
"r_x2": 286.36,
"r_y2": 514.11,
"r_x3": 70.04,
"r_y3": 514.11,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 534.97,
"r_x1": 286.36,
"r_y1": 534.97,
"r_x2": 286.36,
"r_y2": 526.06,
"r_x3": 70.04,
"r_y3": 526.06,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 546.93,
"r_x1": 161.65,
"r_y1": 546.93,
"r_x2": 161.65,
"r_y2": 538.02,
"r_x3": 70.04,
"r_y3": 538.02,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."
},
{
"label": "list_item",
"id": 9,
"page_no": 1,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 559.64,
"r": 286.36,
"b": 592.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 568.66,
"r_x1": 71.12,
"r_y1": 568.66,
"r_x2": 71.12,
"r_y2": 559.76,
"r_x3": 61.57,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.66,
"r_x1": 116.71,
"r_y1": 568.66,
"r_x2": 116.71,
"r_y2": 559.76,
"r_x3": 73.5,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.58,
"r_y0": 568.59,
"r_x1": 177.68,
"r_y1": 568.59,
"r_x2": 177.68,
"r_y2": 559.64,
"r_x3": 121.58,
"r_y3": 559.64,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.55,
"r_y0": 568.66,
"r_x1": 286.36,
"r_y1": 568.66,
"r_x2": 286.36,
"r_y2": 559.76,
"r_x3": 182.55,
"r_y3": 559.76,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 580.62,
"r_x1": 286.36,
"r_y1": 580.62,
"r_x2": 286.36,
"r_y2": 571.71,
"r_x3": 70.04,
"r_y3": 571.71,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 592.57,
"r_x1": 82.4,
"r_y1": 592.57,
"r_x2": 82.4,
"r_y2": 583.67,
"r_x3": 70.04,
"r_y3": 583.67,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."
},
{
"label": "list_item",
"id": 8,
"page_no": 1,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 605.4,
"r": 286.37,
"b": 638.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.981,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 614.31,
"r_x1": 72.33,
"r_y1": 614.31,
"r_x2": 72.33,
"r_y2": 605.4,
"r_x3": 61.57,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.02,
"r_y0": 614.31,
"r_x1": 286.37,
"r_y1": 614.31,
"r_x2": 286.37,
"r_y2": 605.4,
"r_x3": 75.02,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 626.26,
"r_x1": 286.36,
"r_y1": 626.26,
"r_x2": 286.36,
"r_y2": 617.36,
"r_x3": 70.04,
"r_y3": 617.36,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 638.22,
"r_x1": 198.06,
"r_y1": 638.22,
"r_x2": 198.06,
"r_y2": 629.31,
"r_x3": 70.04,
"r_y3": 629.31,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."
},
{
"label": "text",
"id": 11,
"page_no": 1,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 650.6,
"r": 286.37,
"b": 695.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 659.5,
"r_x1": 286.36,
"r_y1": 659.5,
"r_x2": 286.36,
"r_y2": 650.6,
"r_x3": 62.07,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 671.46,
"r_x1": 286.37,
"r_y1": 671.46,
"r_x2": 286.37,
"r_y2": 662.55,
"r_x3": 50.11,
"r_y3": 662.55,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 683.41,
"r_x1": 286.37,
"r_y1": 683.41,
"r_x2": 286.37,
"r_y2": 674.51,
"r_x3": 50.11,
"r_y3": 674.51,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 695.37,
"r_x1": 286.37,
"r_y1": 695.37,
"r_x2": 286.37,
"r_y2": 686.46,
"r_x3": 50.11,
"r_y3": 686.46,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"
},
{
"label": "footnote",
"id": 14,
"page_no": 1,
"cluster": {
"id": 14,
"label": "footnote",
"bbox": {
"l": 60.97,
"t": 705.6,
"r": 183.73,
"b": 712.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.895,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.97,
"r_y0": 712.72,
"r_x1": 183.73,
"r_y1": 712.72,
"r_x2": 183.73,
"r_y2": 705.6,
"r_x3": 60.97,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet"
},
{
"label": "text",
"id": 10,
"page_no": 1,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 508.08,
"r_y1": 108.02,
"r_x2": 508.08,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."
},
{
"label": "section_header",
"id": 13,
"page_no": 1,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 121.73,
"r": 498.28,
"b": 132.48,
"coord_origin": "TOPLEFT"
},
"confidence": 0.943,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 132.48,
"r_x1": 315.58,
"r_y1": 132.48,
"r_x2": 315.58,
"r_y2": 121.73,
"r_x3": 308.86,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.54,
"r_y0": 132.48,
"r_x1": 498.28,
"r_y1": 132.48,
"r_x2": 498.28,
"r_y2": 121.73,
"r_x3": 324.54,
"r_y3": 121.73,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Previous work and State of the Art"
},
{
"label": "text",
"id": 0,
"page_no": 1,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 142.22,
"r": 545.12,
"b": 330.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 151.13,
"r_x1": 545.11,
"r_y1": 151.13,
"r_x2": 545.11,
"r_y2": 142.22,
"r_x3": 320.82,
"r_y3": 142.22,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 163.08,
"r_x1": 545.12,
"r_y1": 163.08,
"r_x2": 545.12,
"r_y2": 154.18,
"r_x3": 308.86,
"r_y3": 154.18,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 175.04,
"r_x1": 522.56,
"r_y1": 175.04,
"r_x2": 522.56,
"r_y2": 166.13,
"r_x3": 308.86,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 175.04,
"r_x1": 545.12,
"r_y1": 175.04,
"r_x2": 545.12,
"r_y2": 166.13,
"r_x3": 529.62,
"r_y3": 166.13,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 186.99,
"r_x1": 545.12,
"r_y1": 186.99,
"r_x2": 545.12,
"r_y2": 178.09,
"r_x3": 308.86,
"r_y3": 178.09,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 198.95,
"r_x1": 545.12,
"r_y1": 198.95,
"r_x2": 545.12,
"r_y2": 190.04,
"r_x3": 308.86,
"r_y3": 190.04,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 210.9,
"r_x1": 346.98,
"r_y1": 210.9,
"r_x2": 346.98,
"r_y2": 202.0,
"r_x3": 308.86,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.87,
"r_y0": 210.9,
"r_x1": 545.12,
"r_y1": 210.9,
"r_x2": 545.12,
"r_y2": 202.0,
"r_x3": 354.87,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 222.86,
"r_x1": 545.12,
"r_y1": 222.86,
"r_x2": 545.12,
"r_y2": 213.95,
"r_x3": 308.86,
"r_y3": 213.95,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 234.81,
"r_x1": 530.92,
"r_y1": 234.81,
"r_x2": 530.92,
"r_y2": 225.91,
"r_x3": 308.86,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.92,
"r_y0": 234.81,
"r_x1": 545.12,
"r_y1": 234.81,
"r_x2": 545.12,
"r_y2": 225.91,
"r_x3": 537.92,
"r_y3": 225.91,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 246.77,
"r_x1": 545.12,
"r_y1": 246.77,
"r_x2": 545.12,
"r_y2": 237.86,
"r_x3": 308.86,
"r_y3": 237.86,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.72,
"r_x1": 545.12,
"r_y1": 258.72,
"r_x2": 545.12,
"r_y2": 249.82,
"r_x3": 308.86,
"r_y3": 249.82,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.68,
"r_x1": 439.84,
"r_y1": 270.68,
"r_x2": 439.84,
"r_y2": 261.77,
"r_x3": 308.86,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.44,
"r_y0": 270.46,
"r_x1": 452.19,
"r_y1": 270.46,
"r_x2": 452.19,
"r_y2": 261.61,
"r_x3": 444.44,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.89,
"r_y0": 270.46,
"r_x1": 470.83,
"r_y1": 270.46,
"r_x2": 470.83,
"r_y2": 261.61,
"r_x3": 455.89,
"r_y3": 261.61,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.83,
"r_y0": 270.68,
"r_x1": 545.12,
"r_y1": 270.68,
"r_x2": 545.12,
"r_y2": 261.77,
"r_x3": 470.83,
"r_y3": 261.77,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.63,
"r_x1": 545.12,
"r_y1": 282.63,
"r_x2": 545.12,
"r_y2": 273.73,
"r_x3": 308.86,
"r_y3": 273.73,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.59,
"r_x1": 545.12,
"r_y1": 294.59,
"r_x2": 545.12,
"r_y2": 285.68,
"r_x3": 308.86,
"r_y3": 285.68,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 306.55,
"r_x1": 545.12,
"r_y1": 306.55,
"r_x2": 545.12,
"r_y2": 297.64,
"r_x3": 308.86,
"r_y3": 297.64,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 318.5,
"r_x1": 545.12,
"r_y1": 318.5,
"r_x2": 545.12,
"r_y2": 309.59,
"r_x3": 308.86,
"r_y3": 309.59,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 330.46,
"r_x1": 425.92,
"r_y1": 330.46,
"r_x2": 425.92,
"r_y2": 321.55,
"r_x3": 308.86,
"r_y3": 321.55,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."
},
{
"label": "text",
"id": 1,
"page_no": 1,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 333.57,
"r": 545.12,
"b": 450.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 342.48,
"r_x1": 545.11,
"r_y1": 342.48,
"r_x2": 545.11,
"r_y2": 333.57,
"r_x3": 320.82,
"r_y3": 333.57,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 354.43,
"r_x1": 545.11,
"r_y1": 354.43,
"r_x2": 545.11,
"r_y2": 345.52,
"r_x3": 308.86,
"r_y3": 345.52,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 366.39,
"r_x1": 545.12,
"r_y1": 366.39,
"r_x2": 545.12,
"r_y2": 357.48,
"r_x3": 308.86,
"r_y3": 357.48,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 378.34,
"r_x1": 545.12,
"r_y1": 378.34,
"r_x2": 545.12,
"r_y2": 369.44,
"r_x3": 308.86,
"r_y3": 369.44,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 390.3,
"r_x1": 545.12,
"r_y1": 390.3,
"r_x2": 545.12,
"r_y2": 381.39,
"r_x3": 308.86,
"r_y3": 381.39,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 402.25,
"r_x1": 545.12,
"r_y1": 402.25,
"r_x2": 545.12,
"r_y2": 393.35,
"r_x3": 308.86,
"r_y3": 393.35,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 414.21,
"r_x1": 545.12,
"r_y1": 414.21,
"r_x2": 545.12,
"r_y2": 405.3,
"r_x3": 308.86,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 426.16,
"r_x1": 545.12,
"r_y1": 426.16,
"r_x2": 545.12,
"r_y2": 417.26,
"r_x3": 308.86,
"r_y3": 417.26,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 438.12,
"r_x1": 545.12,
"r_y1": 438.12,
"r_x2": 545.12,
"r_y2": 429.21,
"r_x3": 308.86,
"r_y3": 429.21,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 450.07,
"r_x1": 401.29,
"r_y1": 450.07,
"r_x2": 401.29,
"r_y2": 441.17,
"r_x3": 308.86,
"r_y3": 441.17,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification."
},
{
"label": "text",
"id": 3,
"page_no": 1,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 453.07,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 462.02,
"r_x1": 423.26,
"r_y1": 462.02,
"r_x2": 423.26,
"r_y2": 453.07,
"r_x3": 320.82,
"r_y3": 453.07,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.27,
"r_y0": 462.09,
"r_x1": 545.11,
"r_y1": 462.09,
"r_x2": 545.11,
"r_y2": 453.19,
"r_x3": 423.27,
"r_y3": 453.19,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 474.05,
"r_x1": 545.12,
"r_y1": 474.05,
"r_x2": 545.12,
"r_y2": 465.14,
"r_x3": 308.86,
"r_y3": 465.14,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.86,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.85,
"r_y0": 486.0,
"r_x1": 545.12,
"r_y1": 486.0,
"r_x2": 545.12,
"r_y2": 477.1,
"r_x3": 345.85,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.96,
"r_x1": 545.11,
"r_y1": 497.96,
"r_x2": 545.11,
"r_y2": 489.05,
"r_x3": 308.86,
"r_y3": 489.05,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.91,
"r_x1": 545.11,
"r_y1": 509.91,
"r_x2": 545.11,
"r_y2": 501.01,
"r_x3": 308.86,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.87,
"r_x1": 545.12,
"r_y1": 521.87,
"r_x2": 545.12,
"r_y2": 512.96,
"r_x3": 308.86,
"r_y3": 512.96,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.82,
"r_x1": 545.12,
"r_y1": 533.82,
"r_x2": 545.12,
"r_y2": 524.92,
"r_x3": 308.86,
"r_y3": 524.92,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.78,
"r_x1": 420.94,
"r_y1": 545.78,
"r_x2": 420.94,
"r_y2": 536.87,
"r_x3": 308.86,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.59,
"r_y0": 545.56,
"r_x1": 433.56,
"r_y1": 545.56,
"r_x2": 433.56,
"r_y2": 536.16,
"r_x3": 423.59,
"r_y3": 536.16,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.21,
"r_y0": 545.78,
"r_x1": 545.11,
"r_y1": 545.78,
"r_x2": 545.11,
"r_y2": 536.87,
"r_x3": 436.21,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.73,
"r_x1": 545.12,
"r_y1": 557.73,
"r_x2": 545.12,
"r_y2": 548.83,
"r_x3": 308.86,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.69,
"r_x1": 545.11,
"r_y1": 569.69,
"r_x2": 545.11,
"r_y2": 560.78,
"r_x3": 308.86,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.64,
"r_x1": 545.11,
"r_y1": 581.64,
"r_x2": 545.11,
"r_y2": 572.74,
"r_x3": 308.86,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.6,
"r_x1": 545.12,
"r_y1": 593.6,
"r_x2": 545.12,
"r_y2": 584.69,
"r_x3": 308.86,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.56,
"r_x1": 497.08,
"r_y1": 605.56,
"r_x2": 497.08,
"r_y2": 596.65,
"r_x3": 308.86,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.34,
"r_x1": 509.77,
"r_y1": 605.34,
"r_x2": 509.77,
"r_y2": 595.93,
"r_x3": 499.8,
"r_y3": 595.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.56,
"r_x1": 545.11,
"r_y1": 605.56,
"r_x2": 545.11,
"r_y2": 596.65,
"r_x3": 512.5,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.51,
"r_x1": 545.12,
"r_y1": 617.51,
"r_x2": 545.12,
"r_y2": 608.6,
"r_x3": 308.86,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.47,
"r_x1": 545.12,
"r_y1": 629.47,
"r_x2": 545.12,
"r_y2": 620.56,
"r_x3": 308.86,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.42,
"r_x1": 364.78,
"r_y1": 641.42,
"r_x2": 364.78,
"r_y2": 632.51,
"r_x3": 308.86,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.57,
"r_y0": 641.19,
"r_x1": 415.61,
"r_y1": 641.19,
"r_x2": 415.61,
"r_y2": 632.6,
"r_x3": 367.57,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.61,
"r_y0": 641.42,
"r_x1": 545.12,
"r_y1": 641.42,
"r_x2": 545.12,
"r_y2": 632.51,
"r_x3": 415.61,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.51,
"r_x3": 308.86,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.91,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.43,
"r_x3": 376.91,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.12,
"r_y1": 677.29,
"r_x2": 545.12,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.01,
"r_x1": 356.9,
"r_y1": 689.01,
"r_x2": 356.9,
"r_y2": 680.42,
"r_x3": 308.86,
"r_y3": 680.42,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.13,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 357.13,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"
}
],
"headers": [
{
"label": "page_footer",
"id": 15,
"page_no": 1,
"cluster": {
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2"
}
]
}
},
{
"page_no": 2,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 250.15,
"r_y1": 84.11,
"r_x2": 250.15,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.13,
"r_x1": 70.37,
"r_y1": 96.13,
"r_x2": 70.37,
"r_y2": 87.22,
"r_x3": 62.07,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.93,
"r_y0": 96.13,
"r_x1": 110.95,
"r_y1": 96.13,
"r_x2": 110.95,
"r_y2": 87.22,
"r_x3": 76.93,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.54,
"r_y0": 96.13,
"r_x1": 136.26,
"r_y1": 96.13,
"r_x2": 136.26,
"r_y2": 87.22,
"r_x3": 118.54,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.82,
"r_y0": 96.13,
"r_x1": 175.37,
"r_y1": 96.13,
"r_x2": 175.37,
"r_y2": 87.22,
"r_x3": 142.82,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.95,
"r_y0": 96.13,
"r_x1": 232.84,
"r_y1": 96.13,
"r_x2": 232.84,
"r_y2": 87.22,
"r_x3": 181.95,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.41,
"r_y0": 96.13,
"r_x1": 265.41,
"r_y1": 96.13,
"r_x2": 265.41,
"r_y2": 87.22,
"r_x3": 239.41,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 271.98,
"r_y0": 96.13,
"r_x1": 286.36,
"r_y1": 96.13,
"r_x2": 286.36,
"r_y2": 87.22,
"r_x3": 271.98,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.08,
"r_x1": 286.37,
"r_y1": 108.08,
"r_x2": 286.37,
"r_y2": 99.17,
"r_x3": 50.11,
"r_y3": 99.17,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.04,
"r_x1": 286.37,
"r_y1": 120.04,
"r_x2": 286.37,
"r_y2": 111.13,
"r_x3": 50.11,
"r_y3": 111.13,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.99,
"r_x1": 286.37,
"r_y1": 131.99,
"r_x2": 286.37,
"r_y2": 123.09,
"r_x3": 50.11,
"r_y3": 123.09,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.95,
"r_x1": 286.37,
"r_y1": 143.95,
"r_x2": 286.37,
"r_y2": 135.04,
"r_x3": 50.11,
"r_y3": 135.04,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.9,
"r_x1": 286.37,
"r_y1": 155.9,
"r_x2": 286.37,
"r_y2": 147.0,
"r_x3": 50.11,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 167.86,
"r_x1": 286.37,
"r_y1": 167.86,
"r_x2": 286.37,
"r_y2": 158.95,
"r_x3": 50.11,
"r_y3": 158.95,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 179.81,
"r_x1": 286.37,
"r_y1": 179.81,
"r_x2": 286.37,
"r_y2": 170.91,
"r_x3": 50.11,
"r_y3": 170.91,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 191.77,
"r_x1": 286.37,
"r_y1": 191.77,
"r_x2": 286.37,
"r_y2": 182.86,
"r_x3": 50.11,
"r_y3": 182.86,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 203.72,
"r_x1": 286.37,
"r_y1": 203.72,
"r_x2": 286.37,
"r_y2": 194.82,
"r_x3": 50.11,
"r_y3": 194.82,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 215.68,
"r_x1": 286.37,
"r_y1": 215.68,
"r_x2": 286.37,
"r_y2": 206.77,
"r_x3": 50.11,
"r_y3": 206.77,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 227.63,
"r_x1": 286.37,
"r_y1": 227.63,
"r_x2": 286.37,
"r_y2": 218.73,
"r_x3": 50.11,
"r_y3": 218.73,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 239.59,
"r_x1": 286.37,
"r_y1": 239.59,
"r_x2": 286.37,
"r_y2": 230.68,
"r_x3": 50.11,
"r_y3": 230.68,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 251.54,
"r_x1": 286.37,
"r_y1": 251.54,
"r_x2": 286.37,
"r_y2": 242.64,
"r_x3": 50.11,
"r_y3": 242.64,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 263.5,
"r_x1": 286.37,
"r_y1": 263.5,
"r_x2": 286.37,
"r_y2": 254.59,
"r_x3": 50.11,
"r_y3": 254.59,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 275.45,
"r_x1": 64.78,
"r_y1": 275.45,
"r_x2": 64.78,
"r_y2": 266.55,
"r_x3": 50.11,
"r_y3": 266.55,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 287.4,
"r_x1": 171.57,
"r_y1": 287.4,
"r_x2": 171.57,
"r_y2": 278.44,
"r_x3": 62.07,
"r_y3": 278.44,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.57,
"r_y0": 287.47,
"r_x1": 174.34,
"r_y1": 287.47,
"r_x2": 174.34,
"r_y2": 278.56,
"r_x3": 171.57,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.19,
"r_y0": 287.47,
"r_x1": 286.36,
"r_y1": 287.47,
"r_x2": 286.36,
"r_y2": 278.56,
"r_x3": 185.19,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 299.42,
"r_x1": 286.37,
"r_y1": 299.42,
"r_x2": 286.37,
"r_y2": 290.51,
"r_x3": 50.11,
"r_y3": 290.51,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 311.38,
"r_x1": 131.17,
"r_y1": 311.38,
"r_x2": 131.17,
"r_y2": 302.47,
"r_x3": 50.11,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.85,
"r_y0": 311.38,
"r_x1": 286.37,
"r_y1": 311.38,
"r_x2": 286.37,
"r_y2": 302.47,
"r_x3": 138.85,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.33,
"r_x1": 286.37,
"r_y1": 323.33,
"r_x2": 286.37,
"r_y2": 314.42,
"r_x3": 50.11,
"r_y3": 314.42,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.29,
"r_x1": 286.37,
"r_y1": 335.29,
"r_x2": 286.37,
"r_y2": 326.38,
"r_x3": 50.11,
"r_y3": 326.38,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.24,
"r_x1": 286.37,
"r_y1": 347.24,
"r_x2": 286.37,
"r_y2": 338.33,
"r_x3": 50.11,
"r_y3": 338.33,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.2,
"r_x1": 286.37,
"r_y1": 359.2,
"r_x2": 286.37,
"r_y2": 350.29,
"r_x3": 50.11,
"r_y3": 350.29,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.15,
"r_x1": 286.37,
"r_y1": 371.15,
"r_x2": 286.37,
"r_y2": 362.25,
"r_x3": 50.11,
"r_y3": 362.25,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.11,
"r_x1": 286.37,
"r_y1": 383.11,
"r_x2": 286.37,
"r_y2": 374.2,
"r_x3": 50.11,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.06,
"r_x1": 286.37,
"r_y1": 395.06,
"r_x2": 286.37,
"r_y2": 386.16,
"r_x3": 50.11,
"r_y3": 386.16,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 407.02,
"r_x1": 286.37,
"r_y1": 407.02,
"r_x2": 286.37,
"r_y2": 398.11,
"r_x3": 50.11,
"r_y3": 398.11,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 418.97,
"r_x1": 286.37,
"r_y1": 418.97,
"r_x2": 286.37,
"r_y2": 410.07,
"r_x3": 50.11,
"r_y3": 410.07,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 430.93,
"r_x1": 286.37,
"r_y1": 430.93,
"r_x2": 286.37,
"r_y2": 422.02,
"r_x3": 50.11,
"r_y3": 422.02,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 442.88,
"r_x1": 198.24,
"r_y1": 442.88,
"r_x2": 198.24,
"r_y2": 433.98,
"r_x3": 50.11,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.93,
"r_y0": 442.88,
"r_x1": 286.37,
"r_y1": 442.88,
"r_x2": 286.37,
"r_y2": 433.98,
"r_x3": 205.93,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 454.84,
"r_x1": 286.37,
"r_y1": 454.84,
"r_x2": 286.37,
"r_y2": 445.93,
"r_x3": 50.11,
"r_y3": 445.93,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 466.79,
"r_x1": 286.37,
"r_y1": 466.79,
"r_x2": 286.37,
"r_y2": 457.89,
"r_x3": 50.11,
"r_y3": 457.89,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 478.75,
"r_x1": 286.37,
"r_y1": 478.75,
"r_x2": 286.37,
"r_y2": 469.84,
"r_x3": 50.11,
"r_y3": 469.84,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.11,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 502.65,
"r_x1": 252.88,
"r_y1": 502.65,
"r_x2": 252.88,
"r_y2": 493.69,
"r_x3": 62.07,
"r_y3": 493.69,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.88,
"r_y0": 502.71,
"r_x1": 286.37,
"r_y1": 502.71,
"r_x2": 286.37,
"r_y2": 493.81,
"r_x3": 252.88,
"r_y3": 493.81,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.67,
"r_x1": 286.37,
"r_y1": 514.67,
"r_x2": 286.37,
"r_y2": 505.76,
"r_x3": 50.11,
"r_y3": 505.76,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 526.62,
"r_x1": 286.37,
"r_y1": 526.62,
"r_x2": 286.37,
"r_y2": 517.72,
"r_x3": 50.11,
"r_y3": 517.72,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 538.58,
"r_x1": 286.37,
"r_y1": 538.58,
"r_x2": 286.37,
"r_y2": 529.67,
"r_x3": 50.11,
"r_y3": 529.67,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.54,
"r_x1": 286.37,
"r_y1": 550.54,
"r_x2": 286.37,
"r_y2": 541.63,
"r_x3": 50.11,
"r_y3": 541.63,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 562.49,
"r_x1": 286.37,
"r_y1": 562.49,
"r_x2": 286.37,
"r_y2": 553.58,
"r_x3": 50.11,
"r_y3": 553.58,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 574.45,
"r_x1": 286.37,
"r_y1": 574.45,
"r_x2": 286.37,
"r_y2": 565.54,
"r_x3": 50.11,
"r_y3": 565.54,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.4,
"r_x1": 286.37,
"r_y1": 586.4,
"r_x2": 286.37,
"r_y2": 577.49,
"r_x3": 50.11,
"r_y3": 577.49,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 598.36,
"r_x1": 286.37,
"r_y1": 598.36,
"r_x2": 286.37,
"r_y2": 589.45,
"r_x3": 50.11,
"r_y3": 589.45,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 610.31,
"r_x1": 286.37,
"r_y1": 610.31,
"r_x2": 286.37,
"r_y2": 601.4,
"r_x3": 50.11,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 622.27,
"r_x1": 175.99,
"r_y1": 622.27,
"r_x2": 175.99,
"r_y2": 613.36,
"r_x3": 50.11,
"r_y3": 613.36,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.69,
"r_x1": 57.82,
"r_y1": 646.69,
"r_x2": 57.82,
"r_y2": 635.94,
"r_x3": 50.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.11,
"r_y0": 646.69,
"r_x1": 105.23,
"r_y1": 646.69,
"r_x2": 105.23,
"r_y2": 635.94,
"r_x3": 68.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 665.33,
"r_x1": 286.36,
"r_y1": 665.33,
"r_x2": 286.36,
"r_y2": 656.43,
"r_x3": 62.07,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 166.25,
"r_y1": 701.2,
"r_x2": 166.25,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.69,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 173.69,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 276.74,
"r_x1": 346.06,
"r_y1": 276.74,
"r_x2": 346.06,
"r_y2": 267.84,
"r_x3": 308.86,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.49,
"r_y0": 276.74,
"r_x1": 545.12,
"r_y1": 276.74,
"r_x2": 545.12,
"r_y2": 267.84,
"r_x3": 354.49,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 288.7,
"r_x1": 498.57,
"r_y1": 288.7,
"r_x2": 498.57,
"r_y2": 279.79,
"r_x3": 308.86,
"r_y3": 279.79,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 326.38,
"r_x1": 437.27,
"r_y1": 326.38,
"r_x2": 437.27,
"r_y2": 317.47,
"r_x3": 308.86,
"r_y3": 317.47,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 340.44,
"r_x1": 545.12,
"r_y1": 340.44,
"r_x2": 545.12,
"r_y2": 331.53,
"r_x3": 320.82,
"r_y3": 331.53,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.39,
"r_x1": 545.12,
"r_y1": 352.39,
"r_x2": 545.12,
"r_y2": 343.49,
"r_x3": 308.86,
"r_y3": 343.49,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.35,
"r_x1": 545.12,
"r_y1": 364.35,
"r_x2": 545.12,
"r_y2": 355.44,
"r_x3": 308.86,
"r_y3": 355.44,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 376.3,
"r_x1": 545.12,
"r_y1": 376.3,
"r_x2": 545.12,
"r_y2": 367.4,
"r_x3": 308.86,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.26,
"r_x1": 545.12,
"r_y1": 388.26,
"r_x2": 545.12,
"r_y2": 379.35,
"r_x3": 308.86,
"r_y3": 379.35,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.21,
"r_x1": 545.12,
"r_y1": 400.21,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 308.86,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.26,
"r_x3": 308.86,
"r_y3": 403.26,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.12,
"r_x1": 545.12,
"r_y1": 424.12,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.17,
"r_x3": 308.86,
"r_y3": 427.17,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.03,
"r_x1": 545.12,
"r_y1": 448.03,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 545.12,
"r_y1": 459.99,
"r_x2": 545.12,
"r_y2": 451.08,
"r_x3": 308.86,
"r_y3": 451.08,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 471.94,
"r_x1": 545.12,
"r_y1": 471.94,
"r_x2": 545.12,
"r_y2": 463.04,
"r_x3": 308.86,
"r_y3": 463.04,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 483.9,
"r_x1": 545.12,
"r_y1": 483.9,
"r_x2": 545.12,
"r_y2": 474.99,
"r_x3": 308.86,
"r_y3": 474.99,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 495.86,
"r_x1": 545.12,
"r_y1": 495.86,
"r_x2": 545.12,
"r_y2": 486.95,
"r_x3": 308.86,
"r_y3": 486.95,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 507.81,
"r_x1": 545.12,
"r_y1": 507.81,
"r_x2": 545.12,
"r_y2": 498.9,
"r_x3": 308.86,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 519.77,
"r_x1": 545.12,
"r_y1": 519.77,
"r_x2": 545.12,
"r_y2": 510.86,
"r_x3": 308.86,
"r_y3": 510.86,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 531.72,
"r_x1": 545.12,
"r_y1": 531.72,
"r_x2": 545.12,
"r_y2": 522.81,
"r_x3": 308.86,
"r_y3": 522.81,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 543.68,
"r_x1": 545.12,
"r_y1": 543.68,
"r_x2": 545.12,
"r_y2": 534.77,
"r_x3": 308.86,
"r_y3": 534.77,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.63,
"r_x1": 545.12,
"r_y1": 555.63,
"r_x2": 545.12,
"r_y2": 546.72,
"r_x3": 308.86,
"r_y3": 546.72,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.59,
"r_x1": 545.12,
"r_y1": 567.59,
"r_x2": 545.12,
"r_y2": 558.68,
"r_x3": 308.86,
"r_y3": 558.68,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 579.54,
"r_x1": 545.12,
"r_y1": 579.54,
"r_x2": 545.12,
"r_y2": 570.64,
"r_x3": 308.86,
"r_y3": 570.64,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 591.5,
"r_x1": 545.11,
"r_y1": 591.5,
"r_x2": 545.11,
"r_y2": 582.59,
"r_x3": 308.86,
"r_y3": 582.59,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 603.45,
"r_x1": 545.12,
"r_y1": 603.45,
"r_x2": 545.12,
"r_y2": 594.55,
"r_x3": 308.86,
"r_y3": 594.55,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 615.41,
"r_x1": 545.12,
"r_y1": 615.41,
"r_x2": 545.12,
"r_y2": 606.5,
"r_x3": 308.86,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 627.36,
"r_x1": 348.16,
"r_y1": 627.36,
"r_x2": 348.16,
"r_y2": 618.46,
"r_x3": 308.86,
"r_y3": 618.46,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 641.42,
"r_x1": 545.11,
"r_y1": 641.42,
"r_x2": 545.11,
"r_y2": 632.51,
"r_x3": 320.82,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.42,
"r_x3": 308.86,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 250.15,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 250.15,
"r_y1": 84.11,
"r_x2": 250.15,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.22,
"r": 286.37,
"b": 275.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.13,
"r_x1": 70.37,
"r_y1": 96.13,
"r_x2": 70.37,
"r_y2": 87.22,
"r_x3": 62.07,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.93,
"r_y0": 96.13,
"r_x1": 110.95,
"r_y1": 96.13,
"r_x2": 110.95,
"r_y2": 87.22,
"r_x3": 76.93,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.54,
"r_y0": 96.13,
"r_x1": 136.26,
"r_y1": 96.13,
"r_x2": 136.26,
"r_y2": 87.22,
"r_x3": 118.54,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.82,
"r_y0": 96.13,
"r_x1": 175.37,
"r_y1": 96.13,
"r_x2": 175.37,
"r_y2": 87.22,
"r_x3": 142.82,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.95,
"r_y0": 96.13,
"r_x1": 232.84,
"r_y1": 96.13,
"r_x2": 232.84,
"r_y2": 87.22,
"r_x3": 181.95,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.41,
"r_y0": 96.13,
"r_x1": 265.41,
"r_y1": 96.13,
"r_x2": 265.41,
"r_y2": 87.22,
"r_x3": 239.41,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 271.98,
"r_y0": 96.13,
"r_x1": 286.36,
"r_y1": 96.13,
"r_x2": 286.36,
"r_y2": 87.22,
"r_x3": 271.98,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.08,
"r_x1": 286.37,
"r_y1": 108.08,
"r_x2": 286.37,
"r_y2": 99.17,
"r_x3": 50.11,
"r_y3": 99.17,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.04,
"r_x1": 286.37,
"r_y1": 120.04,
"r_x2": 286.37,
"r_y2": 111.13,
"r_x3": 50.11,
"r_y3": 111.13,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.99,
"r_x1": 286.37,
"r_y1": 131.99,
"r_x2": 286.37,
"r_y2": 123.09,
"r_x3": 50.11,
"r_y3": 123.09,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.95,
"r_x1": 286.37,
"r_y1": 143.95,
"r_x2": 286.37,
"r_y2": 135.04,
"r_x3": 50.11,
"r_y3": 135.04,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.9,
"r_x1": 286.37,
"r_y1": 155.9,
"r_x2": 286.37,
"r_y2": 147.0,
"r_x3": 50.11,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 167.86,
"r_x1": 286.37,
"r_y1": 167.86,
"r_x2": 286.37,
"r_y2": 158.95,
"r_x3": 50.11,
"r_y3": 158.95,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 179.81,
"r_x1": 286.37,
"r_y1": 179.81,
"r_x2": 286.37,
"r_y2": 170.91,
"r_x3": 50.11,
"r_y3": 170.91,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 191.77,
"r_x1": 286.37,
"r_y1": 191.77,
"r_x2": 286.37,
"r_y2": 182.86,
"r_x3": 50.11,
"r_y3": 182.86,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 203.72,
"r_x1": 286.37,
"r_y1": 203.72,
"r_x2": 286.37,
"r_y2": 194.82,
"r_x3": 50.11,
"r_y3": 194.82,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 215.68,
"r_x1": 286.37,
"r_y1": 215.68,
"r_x2": 286.37,
"r_y2": 206.77,
"r_x3": 50.11,
"r_y3": 206.77,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 227.63,
"r_x1": 286.37,
"r_y1": 227.63,
"r_x2": 286.37,
"r_y2": 218.73,
"r_x3": 50.11,
"r_y3": 218.73,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 239.59,
"r_x1": 286.37,
"r_y1": 239.59,
"r_x2": 286.37,
"r_y2": 230.68,
"r_x3": 50.11,
"r_y3": 230.68,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 251.54,
"r_x1": 286.37,
"r_y1": 251.54,
"r_x2": 286.37,
"r_y2": 242.64,
"r_x3": 50.11,
"r_y3": 242.64,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 263.5,
"r_x1": 286.37,
"r_y1": 263.5,
"r_x2": 286.37,
"r_y2": 254.59,
"r_x3": 50.11,
"r_y3": 254.59,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 275.45,
"r_x1": 64.78,
"r_y1": 275.45,
"r_x2": 64.78,
"r_y2": 266.55,
"r_x3": 50.11,
"r_y3": 266.55,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 278.44,
"r": 286.37,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 287.4,
"r_x1": 171.57,
"r_y1": 287.4,
"r_x2": 171.57,
"r_y2": 278.44,
"r_x3": 62.07,
"r_y3": 278.44,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.57,
"r_y0": 287.47,
"r_x1": 174.34,
"r_y1": 287.47,
"r_x2": 174.34,
"r_y2": 278.56,
"r_x3": 171.57,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.19,
"r_y0": 287.47,
"r_x1": 286.36,
"r_y1": 287.47,
"r_x2": 286.36,
"r_y2": 278.56,
"r_x3": 185.19,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 299.42,
"r_x1": 286.37,
"r_y1": 299.42,
"r_x2": 286.37,
"r_y2": 290.51,
"r_x3": 50.11,
"r_y3": 290.51,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 311.38,
"r_x1": 131.17,
"r_y1": 311.38,
"r_x2": 131.17,
"r_y2": 302.47,
"r_x3": 50.11,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.85,
"r_y0": 311.38,
"r_x1": 286.37,
"r_y1": 311.38,
"r_x2": 286.37,
"r_y2": 302.47,
"r_x3": 138.85,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.33,
"r_x1": 286.37,
"r_y1": 323.33,
"r_x2": 286.37,
"r_y2": 314.42,
"r_x3": 50.11,
"r_y3": 314.42,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.29,
"r_x1": 286.37,
"r_y1": 335.29,
"r_x2": 286.37,
"r_y2": 326.38,
"r_x3": 50.11,
"r_y3": 326.38,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.24,
"r_x1": 286.37,
"r_y1": 347.24,
"r_x2": 286.37,
"r_y2": 338.33,
"r_x3": 50.11,
"r_y3": 338.33,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.2,
"r_x1": 286.37,
"r_y1": 359.2,
"r_x2": 286.37,
"r_y2": 350.29,
"r_x3": 50.11,
"r_y3": 350.29,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.15,
"r_x1": 286.37,
"r_y1": 371.15,
"r_x2": 286.37,
"r_y2": 362.25,
"r_x3": 50.11,
"r_y3": 362.25,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.11,
"r_x1": 286.37,
"r_y1": 383.11,
"r_x2": 286.37,
"r_y2": 374.2,
"r_x3": 50.11,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.06,
"r_x1": 286.37,
"r_y1": 395.06,
"r_x2": 286.37,
"r_y2": 386.16,
"r_x3": 50.11,
"r_y3": 386.16,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 407.02,
"r_x1": 286.37,
"r_y1": 407.02,
"r_x2": 286.37,
"r_y2": 398.11,
"r_x3": 50.11,
"r_y3": 398.11,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 418.97,
"r_x1": 286.37,
"r_y1": 418.97,
"r_x2": 286.37,
"r_y2": 410.07,
"r_x3": 50.11,
"r_y3": 410.07,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 430.93,
"r_x1": 286.37,
"r_y1": 430.93,
"r_x2": 286.37,
"r_y2": 422.02,
"r_x3": 50.11,
"r_y3": 422.02,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 442.88,
"r_x1": 198.24,
"r_y1": 442.88,
"r_x2": 198.24,
"r_y2": 433.98,
"r_x3": 50.11,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.93,
"r_y0": 442.88,
"r_x1": 286.37,
"r_y1": 442.88,
"r_x2": 286.37,
"r_y2": 433.98,
"r_x3": 205.93,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 454.84,
"r_x1": 286.37,
"r_y1": 454.84,
"r_x2": 286.37,
"r_y2": 445.93,
"r_x3": 50.11,
"r_y3": 445.93,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 466.79,
"r_x1": 286.37,
"r_y1": 466.79,
"r_x2": 286.37,
"r_y2": 457.89,
"r_x3": 50.11,
"r_y3": 457.89,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 478.75,
"r_x1": 286.37,
"r_y1": 478.75,
"r_x2": 286.37,
"r_y2": 469.84,
"r_x3": 50.11,
"r_y3": 469.84,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.11,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 493.69,
"r": 286.37,
"b": 622.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 502.65,
"r_x1": 252.88,
"r_y1": 502.65,
"r_x2": 252.88,
"r_y2": 493.69,
"r_x3": 62.07,
"r_y3": 493.69,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.88,
"r_y0": 502.71,
"r_x1": 286.37,
"r_y1": 502.71,
"r_x2": 286.37,
"r_y2": 493.81,
"r_x3": 252.88,
"r_y3": 493.81,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.67,
"r_x1": 286.37,
"r_y1": 514.67,
"r_x2": 286.37,
"r_y2": 505.76,
"r_x3": 50.11,
"r_y3": 505.76,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 526.62,
"r_x1": 286.37,
"r_y1": 526.62,
"r_x2": 286.37,
"r_y2": 517.72,
"r_x3": 50.11,
"r_y3": 517.72,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 538.58,
"r_x1": 286.37,
"r_y1": 538.58,
"r_x2": 286.37,
"r_y2": 529.67,
"r_x3": 50.11,
"r_y3": 529.67,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.54,
"r_x1": 286.37,
"r_y1": 550.54,
"r_x2": 286.37,
"r_y2": 541.63,
"r_x3": 50.11,
"r_y3": 541.63,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 562.49,
"r_x1": 286.37,
"r_y1": 562.49,
"r_x2": 286.37,
"r_y2": 553.58,
"r_x3": 50.11,
"r_y3": 553.58,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 574.45,
"r_x1": 286.37,
"r_y1": 574.45,
"r_x2": 286.37,
"r_y2": 565.54,
"r_x3": 50.11,
"r_y3": 565.54,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.4,
"r_x1": 286.37,
"r_y1": 586.4,
"r_x2": 286.37,
"r_y2": 577.49,
"r_x3": 50.11,
"r_y3": 577.49,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 598.36,
"r_x1": 286.37,
"r_y1": 598.36,
"r_x2": 286.37,
"r_y2": 589.45,
"r_x3": 50.11,
"r_y3": 589.45,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 610.31,
"r_x1": 286.37,
"r_y1": 610.31,
"r_x2": 286.37,
"r_y2": 601.4,
"r_x3": 50.11,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 622.27,
"r_x1": 175.99,
"r_y1": 622.27,
"r_x2": 175.99,
"r_y2": 613.36,
"r_x3": 50.11,
"r_y3": 613.36,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 635.94,
"r": 105.23,
"b": 646.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.69,
"r_x1": 57.82,
"r_y1": 646.69,
"r_x2": 57.82,
"r_y2": 635.94,
"r_x3": 50.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.11,
"r_y0": 646.69,
"r_x1": 105.23,
"r_y1": 646.69,
"r_x2": 105.23,
"r_y2": 635.94,
"r_x3": 68.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 656.43,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 665.33,
"r_x1": 286.36,
"r_y1": 665.33,
"r_x2": 286.36,
"r_y2": 656.43,
"r_x3": 62.07,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 166.25,
"r_y1": 701.2,
"r_x2": 166.25,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.69,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 173.69,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.44,
"r": 550.39,
"b": 250.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.975,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.81,
"r": 486.85,
"b": 88.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.569,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.77,
"t": 242.03,
"r": 469.79,
"b": 250.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 320.98,
"t": 233.42,
"r": 324.79,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.48,
"t": 233.42,
"r": 418.11,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.85,
"t": 233.42,
"r": 508.48,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.42,
"r": 372.93,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.67,
"t": 233.42,
"r": 463.3,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.04,
"t": 233.42,
"r": 549.67,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.04,
"t": 230.45,
"r": 319.86,
"b": 236.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.63,
"t": 198.69,
"r": 316.44,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.44,
"t": 198.69,
"r": 320.26,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.15,
"t": 168.1,
"r": 316.97,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 316.96,
"t": 168.1,
"r": 320.78,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.93,
"t": 136.59,
"r": 316.75,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.74,
"t": 136.59,
"r": 320.56,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.48,
"t": 105.6,
"r": 316.3,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.11,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.48,
"t": 212.26,
"r": 316.3,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.26,
"r": 320.11,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.08,
"t": 183.72,
"r": 316.89,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.89,
"t": 183.72,
"r": 320.71,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.76,
"t": 152.47,
"r": 316.58,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.58,
"t": 152.47,
"r": 320.39,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.57,
"r": 316.01,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.01,
"t": 120.57,
"r": 319.83,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.82,
"t": 90.11,
"r": 316.63,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.63,
"t": 90.11,
"r": 320.45,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.17,
"t": 222.73,
"r": 536.94,
"b": 230.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.88,
"t": 108.27,
"r": 547.61,
"b": 115.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.77,
"t": 130.78,
"r": 542.74,
"b": 138.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.92,
"r": 542.76,
"b": 161.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.57,
"t": 176.76,
"r": 542.54,
"b": 184.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.15,
"t": 199.65,
"r": 542.11,
"b": 206.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 7,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 267.84,
"r": 545.12,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 276.74,
"r_x1": 346.06,
"r_y1": 276.74,
"r_x2": 346.06,
"r_y2": 267.84,
"r_x3": 308.86,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.49,
"r_y0": 276.74,
"r_x1": 545.12,
"r_y1": 276.74,
"r_x2": 545.12,
"r_y2": 267.84,
"r_x3": 354.49,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 288.7,
"r_x1": 498.57,
"r_y1": 288.7,
"r_x2": 498.57,
"r_y2": 279.79,
"r_x3": 308.86,
"r_y3": 279.79,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 317.47,
"r": 437.27,
"b": 326.38,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 326.38,
"r_x1": 437.27,
"r_y1": 326.38,
"r_x2": 437.27,
"r_y2": 317.47,
"r_x3": 308.86,
"r_y3": 317.47,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 331.53,
"r": 545.12,
"b": 627.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 340.44,
"r_x1": 545.12,
"r_y1": 340.44,
"r_x2": 545.12,
"r_y2": 331.53,
"r_x3": 320.82,
"r_y3": 331.53,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.39,
"r_x1": 545.12,
"r_y1": 352.39,
"r_x2": 545.12,
"r_y2": 343.49,
"r_x3": 308.86,
"r_y3": 343.49,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.35,
"r_x1": 545.12,
"r_y1": 364.35,
"r_x2": 545.12,
"r_y2": 355.44,
"r_x3": 308.86,
"r_y3": 355.44,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 376.3,
"r_x1": 545.12,
"r_y1": 376.3,
"r_x2": 545.12,
"r_y2": 367.4,
"r_x3": 308.86,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.26,
"r_x1": 545.12,
"r_y1": 388.26,
"r_x2": 545.12,
"r_y2": 379.35,
"r_x3": 308.86,
"r_y3": 379.35,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.21,
"r_x1": 545.12,
"r_y1": 400.21,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 308.86,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.26,
"r_x3": 308.86,
"r_y3": 403.26,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.12,
"r_x1": 545.12,
"r_y1": 424.12,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.17,
"r_x3": 308.86,
"r_y3": 427.17,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.03,
"r_x1": 545.12,
"r_y1": 448.03,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 545.12,
"r_y1": 459.99,
"r_x2": 545.12,
"r_y2": 451.08,
"r_x3": 308.86,
"r_y3": 451.08,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 471.94,
"r_x1": 545.12,
"r_y1": 471.94,
"r_x2": 545.12,
"r_y2": 463.04,
"r_x3": 308.86,
"r_y3": 463.04,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 483.9,
"r_x1": 545.12,
"r_y1": 483.9,
"r_x2": 545.12,
"r_y2": 474.99,
"r_x3": 308.86,
"r_y3": 474.99,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 495.86,
"r_x1": 545.12,
"r_y1": 495.86,
"r_x2": 545.12,
"r_y2": 486.95,
"r_x3": 308.86,
"r_y3": 486.95,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 507.81,
"r_x1": 545.12,
"r_y1": 507.81,
"r_x2": 545.12,
"r_y2": 498.9,
"r_x3": 308.86,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 519.77,
"r_x1": 545.12,
"r_y1": 519.77,
"r_x2": 545.12,
"r_y2": 510.86,
"r_x3": 308.86,
"r_y3": 510.86,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 531.72,
"r_x1": 545.12,
"r_y1": 531.72,
"r_x2": 545.12,
"r_y2": 522.81,
"r_x3": 308.86,
"r_y3": 522.81,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 543.68,
"r_x1": 545.12,
"r_y1": 543.68,
"r_x2": 545.12,
"r_y2": 534.77,
"r_x3": 308.86,
"r_y3": 534.77,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.63,
"r_x1": 545.12,
"r_y1": 555.63,
"r_x2": 545.12,
"r_y2": 546.72,
"r_x3": 308.86,
"r_y3": 546.72,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.59,
"r_x1": 545.12,
"r_y1": 567.59,
"r_x2": 545.12,
"r_y2": 558.68,
"r_x3": 308.86,
"r_y3": 558.68,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 579.54,
"r_x1": 545.12,
"r_y1": 579.54,
"r_x2": 545.12,
"r_y2": 570.64,
"r_x3": 308.86,
"r_y3": 570.64,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 591.5,
"r_x1": 545.11,
"r_y1": 591.5,
"r_x2": 545.11,
"r_y2": 582.59,
"r_x3": 308.86,
"r_y3": 582.59,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 603.45,
"r_x1": 545.12,
"r_y1": 603.45,
"r_x2": 545.12,
"r_y2": 594.55,
"r_x3": 308.86,
"r_y3": 594.55,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 615.41,
"r_x1": 545.12,
"r_y1": 615.41,
"r_x2": 545.12,
"r_y2": 606.5,
"r_x3": 308.86,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 627.36,
"r_x1": 348.16,
"r_y1": 627.36,
"r_x2": 348.16,
"r_y2": 618.46,
"r_x3": 308.86,
"r_y3": 618.46,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 632.51,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 641.42,
"r_x1": 545.11,
"r_y1": 641.42,
"r_x2": 545.11,
"r_y2": 632.51,
"r_x3": 320.82,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.42,
"r_x3": 308.86,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 10,
"page_no": 2,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 250.15,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 250.15,
"r_y1": 84.11,
"r_x2": 250.15,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tag-decoder which is constrained to the table-tags."
},
{
"label": "text",
"id": 5,
"page_no": 2,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.22,
"r": 286.37,
"b": 275.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.13,
"r_x1": 70.37,
"r_y1": 96.13,
"r_x2": 70.37,
"r_y2": 87.22,
"r_x3": 62.07,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.93,
"r_y0": 96.13,
"r_x1": 110.95,
"r_y1": 96.13,
"r_x2": 110.95,
"r_y2": 87.22,
"r_x3": 76.93,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.54,
"r_y0": 96.13,
"r_x1": 136.26,
"r_y1": 96.13,
"r_x2": 136.26,
"r_y2": 87.22,
"r_x3": 118.54,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.82,
"r_y0": 96.13,
"r_x1": 175.37,
"r_y1": 96.13,
"r_x2": 175.37,
"r_y2": 87.22,
"r_x3": 142.82,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.95,
"r_y0": 96.13,
"r_x1": 232.84,
"r_y1": 96.13,
"r_x2": 232.84,
"r_y2": 87.22,
"r_x3": 181.95,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.41,
"r_y0": 96.13,
"r_x1": 265.41,
"r_y1": 96.13,
"r_x2": 265.41,
"r_y2": 87.22,
"r_x3": 239.41,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 271.98,
"r_y0": 96.13,
"r_x1": 286.36,
"r_y1": 96.13,
"r_x2": 286.36,
"r_y2": 87.22,
"r_x3": 271.98,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.08,
"r_x1": 286.37,
"r_y1": 108.08,
"r_x2": 286.37,
"r_y2": 99.17,
"r_x3": 50.11,
"r_y3": 99.17,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.04,
"r_x1": 286.37,
"r_y1": 120.04,
"r_x2": 286.37,
"r_y2": 111.13,
"r_x3": 50.11,
"r_y3": 111.13,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.99,
"r_x1": 286.37,
"r_y1": 131.99,
"r_x2": 286.37,
"r_y2": 123.09,
"r_x3": 50.11,
"r_y3": 123.09,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.95,
"r_x1": 286.37,
"r_y1": 143.95,
"r_x2": 286.37,
"r_y2": 135.04,
"r_x3": 50.11,
"r_y3": 135.04,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.9,
"r_x1": 286.37,
"r_y1": 155.9,
"r_x2": 286.37,
"r_y2": 147.0,
"r_x3": 50.11,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 167.86,
"r_x1": 286.37,
"r_y1": 167.86,
"r_x2": 286.37,
"r_y2": 158.95,
"r_x3": 50.11,
"r_y3": 158.95,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 179.81,
"r_x1": 286.37,
"r_y1": 179.81,
"r_x2": 286.37,
"r_y2": 170.91,
"r_x3": 50.11,
"r_y3": 170.91,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 191.77,
"r_x1": 286.37,
"r_y1": 191.77,
"r_x2": 286.37,
"r_y2": 182.86,
"r_x3": 50.11,
"r_y3": 182.86,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 203.72,
"r_x1": 286.37,
"r_y1": 203.72,
"r_x2": 286.37,
"r_y2": 194.82,
"r_x3": 50.11,
"r_y3": 194.82,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 215.68,
"r_x1": 286.37,
"r_y1": 215.68,
"r_x2": 286.37,
"r_y2": 206.77,
"r_x3": 50.11,
"r_y3": 206.77,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 227.63,
"r_x1": 286.37,
"r_y1": 227.63,
"r_x2": 286.37,
"r_y2": 218.73,
"r_x3": 50.11,
"r_y3": 218.73,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 239.59,
"r_x1": 286.37,
"r_y1": 239.59,
"r_x2": 286.37,
"r_y2": 230.68,
"r_x3": 50.11,
"r_y3": 230.68,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 251.54,
"r_x1": 286.37,
"r_y1": 251.54,
"r_x2": 286.37,
"r_y2": 242.64,
"r_x3": 50.11,
"r_y3": 242.64,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 263.5,
"r_x1": 286.37,
"r_y1": 263.5,
"r_x2": 286.37,
"r_y2": 254.59,
"r_x3": 50.11,
"r_y3": 254.59,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 275.45,
"r_x1": 64.78,
"r_y1": 275.45,
"r_x2": 64.78,
"r_y2": 266.55,
"r_x3": 50.11,
"r_y3": 266.55,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."
},
{
"label": "text",
"id": 0,
"page_no": 2,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 278.44,
"r": 286.37,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 287.4,
"r_x1": 171.57,
"r_y1": 287.4,
"r_x2": 171.57,
"r_y2": 278.44,
"r_x3": 62.07,
"r_y3": 278.44,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.57,
"r_y0": 287.47,
"r_x1": 174.34,
"r_y1": 287.47,
"r_x2": 174.34,
"r_y2": 278.56,
"r_x3": 171.57,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.19,
"r_y0": 287.47,
"r_x1": 286.36,
"r_y1": 287.47,
"r_x2": 286.36,
"r_y2": 278.56,
"r_x3": 185.19,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 299.42,
"r_x1": 286.37,
"r_y1": 299.42,
"r_x2": 286.37,
"r_y2": 290.51,
"r_x3": 50.11,
"r_y3": 290.51,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 311.38,
"r_x1": 131.17,
"r_y1": 311.38,
"r_x2": 131.17,
"r_y2": 302.47,
"r_x3": 50.11,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.85,
"r_y0": 311.38,
"r_x1": 286.37,
"r_y1": 311.38,
"r_x2": 286.37,
"r_y2": 302.47,
"r_x3": 138.85,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.33,
"r_x1": 286.37,
"r_y1": 323.33,
"r_x2": 286.37,
"r_y2": 314.42,
"r_x3": 50.11,
"r_y3": 314.42,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.29,
"r_x1": 286.37,
"r_y1": 335.29,
"r_x2": 286.37,
"r_y2": 326.38,
"r_x3": 50.11,
"r_y3": 326.38,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.24,
"r_x1": 286.37,
"r_y1": 347.24,
"r_x2": 286.37,
"r_y2": 338.33,
"r_x3": 50.11,
"r_y3": 338.33,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.2,
"r_x1": 286.37,
"r_y1": 359.2,
"r_x2": 286.37,
"r_y2": 350.29,
"r_x3": 50.11,
"r_y3": 350.29,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.15,
"r_x1": 286.37,
"r_y1": 371.15,
"r_x2": 286.37,
"r_y2": 362.25,
"r_x3": 50.11,
"r_y3": 362.25,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.11,
"r_x1": 286.37,
"r_y1": 383.11,
"r_x2": 286.37,
"r_y2": 374.2,
"r_x3": 50.11,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.06,
"r_x1": 286.37,
"r_y1": 395.06,
"r_x2": 286.37,
"r_y2": 386.16,
"r_x3": 50.11,
"r_y3": 386.16,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 407.02,
"r_x1": 286.37,
"r_y1": 407.02,
"r_x2": 286.37,
"r_y2": 398.11,
"r_x3": 50.11,
"r_y3": 398.11,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 418.97,
"r_x1": 286.37,
"r_y1": 418.97,
"r_x2": 286.37,
"r_y2": 410.07,
"r_x3": 50.11,
"r_y3": 410.07,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 430.93,
"r_x1": 286.37,
"r_y1": 430.93,
"r_x2": 286.37,
"r_y2": 422.02,
"r_x3": 50.11,
"r_y3": 422.02,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 442.88,
"r_x1": 198.24,
"r_y1": 442.88,
"r_x2": 198.24,
"r_y2": 433.98,
"r_x3": 50.11,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.93,
"r_y0": 442.88,
"r_x1": 286.37,
"r_y1": 442.88,
"r_x2": 286.37,
"r_y2": 433.98,
"r_x3": 205.93,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 454.84,
"r_x1": 286.37,
"r_y1": 454.84,
"r_x2": 286.37,
"r_y2": 445.93,
"r_x3": 50.11,
"r_y3": 445.93,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 466.79,
"r_x1": 286.37,
"r_y1": 466.79,
"r_x2": 286.37,
"r_y2": 457.89,
"r_x3": 50.11,
"r_y3": 457.89,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 478.75,
"r_x1": 286.37,
"r_y1": 478.75,
"r_x2": 286.37,
"r_y2": 469.84,
"r_x3": 50.11,
"r_y3": 469.84,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.11,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."
},
{
"label": "text",
"id": 1,
"page_no": 2,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 493.69,
"r": 286.37,
"b": 622.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 502.65,
"r_x1": 252.88,
"r_y1": 502.65,
"r_x2": 252.88,
"r_y2": 493.69,
"r_x3": 62.07,
"r_y3": 493.69,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.88,
"r_y0": 502.71,
"r_x1": 286.37,
"r_y1": 502.71,
"r_x2": 286.37,
"r_y2": 493.81,
"r_x3": 252.88,
"r_y3": 493.81,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.67,
"r_x1": 286.37,
"r_y1": 514.67,
"r_x2": 286.37,
"r_y2": 505.76,
"r_x3": 50.11,
"r_y3": 505.76,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 526.62,
"r_x1": 286.37,
"r_y1": 526.62,
"r_x2": 286.37,
"r_y2": 517.72,
"r_x3": 50.11,
"r_y3": 517.72,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 538.58,
"r_x1": 286.37,
"r_y1": 538.58,
"r_x2": 286.37,
"r_y2": 529.67,
"r_x3": 50.11,
"r_y3": 529.67,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.54,
"r_x1": 286.37,
"r_y1": 550.54,
"r_x2": 286.37,
"r_y2": 541.63,
"r_x3": 50.11,
"r_y3": 541.63,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 562.49,
"r_x1": 286.37,
"r_y1": 562.49,
"r_x2": 286.37,
"r_y2": 553.58,
"r_x3": 50.11,
"r_y3": 553.58,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 574.45,
"r_x1": 286.37,
"r_y1": 574.45,
"r_x2": 286.37,
"r_y2": 565.54,
"r_x3": 50.11,
"r_y3": 565.54,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.4,
"r_x1": 286.37,
"r_y1": 586.4,
"r_x2": 286.37,
"r_y2": 577.49,
"r_x3": 50.11,
"r_y3": 577.49,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 598.36,
"r_x1": 286.37,
"r_y1": 598.36,
"r_x2": 286.37,
"r_y2": 589.45,
"r_x3": 50.11,
"r_y3": 589.45,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 610.31,
"r_x1": 286.37,
"r_y1": 610.31,
"r_x2": 286.37,
"r_y2": 601.4,
"r_x3": 50.11,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 622.27,
"r_x1": 175.99,
"r_y1": 622.27,
"r_x2": 175.99,
"r_y2": 613.36,
"r_x3": 50.11,
"r_y3": 613.36,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."
},
{
"label": "section_header",
"id": 8,
"page_no": 2,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 635.94,
"r": 105.23,
"b": 646.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.69,
"r_x1": 57.82,
"r_y1": 646.69,
"r_x2": 57.82,
"r_y2": 635.94,
"r_x3": 50.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.11,
"r_y0": 646.69,
"r_x1": 105.23,
"r_y1": 646.69,
"r_x2": 105.23,
"r_y2": 635.94,
"r_x3": 68.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Datasets"
},
{
"label": "text",
"id": 3,
"page_no": 2,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 656.43,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 665.33,
"r_x1": 286.36,
"r_y1": 665.33,
"r_x2": 286.36,
"r_y2": 656.43,
"r_x3": 62.07,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 166.25,
"r_y1": 701.2,
"r_x2": 166.25,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.69,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 173.69,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"
},
{
"label": "picture",
"id": 6,
"page_no": 2,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.44,
"r": 550.39,
"b": 250.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.975,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.81,
"r": 486.85,
"b": 88.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.569,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.77,
"t": 242.03,
"r": 469.79,
"b": 250.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 320.98,
"t": 233.42,
"r": 324.79,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.48,
"t": 233.42,
"r": 418.11,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.85,
"t": 233.42,
"r": 508.48,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.42,
"r": 372.93,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.67,
"t": 233.42,
"r": 463.3,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.04,
"t": 233.42,
"r": 549.67,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.04,
"t": 230.45,
"r": 319.86,
"b": 236.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.63,
"t": 198.69,
"r": 316.44,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.44,
"t": 198.69,
"r": 320.26,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.15,
"t": 168.1,
"r": 316.97,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 316.96,
"t": 168.1,
"r": 320.78,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.93,
"t": 136.59,
"r": 316.75,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.74,
"t": 136.59,
"r": 320.56,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.48,
"t": 105.6,
"r": 316.3,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.11,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.48,
"t": 212.26,
"r": 316.3,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.26,
"r": 320.11,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.08,
"t": 183.72,
"r": 316.89,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.89,
"t": 183.72,
"r": 320.71,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.76,
"t": 152.47,
"r": 316.58,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.58,
"t": 152.47,
"r": 320.39,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.57,
"r": 316.01,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.01,
"t": 120.57,
"r": 319.83,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.82,
"t": 90.11,
"r": 316.63,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.63,
"t": 90.11,
"r": 320.45,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.17,
"t": 222.73,
"r": 536.94,
"b": 230.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.88,
"t": 108.27,
"r": 547.61,
"b": 115.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.77,
"t": 130.78,
"r": 542.74,
"b": 138.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.92,
"r": 542.76,
"b": 161.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.57,
"t": 176.76,
"r": 542.54,
"b": 184.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.15,
"t": 199.65,
"r": 542.11,
"b": 206.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 7,
"page_no": 2,
"cluster": {
"id": 7,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 267.84,
"r": 545.12,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 276.74,
"r_x1": 346.06,
"r_y1": 276.74,
"r_x2": 346.06,
"r_y2": 267.84,
"r_x3": 308.86,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.49,
"r_y0": 276.74,
"r_x1": 545.12,
"r_y1": 276.74,
"r_x2": 545.12,
"r_y2": 267.84,
"r_x3": 354.49,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 288.7,
"r_x1": 498.57,
"r_y1": 288.7,
"r_x2": 498.57,
"r_y2": 279.79,
"r_x3": 308.86,
"r_y3": 279.79,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"
},
{
"label": "text",
"id": 9,
"page_no": 2,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 317.47,
"r": 437.27,
"b": 326.38,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 326.38,
"r_x1": 437.27,
"r_y1": 326.38,
"r_x2": 437.27,
"r_y2": 317.47,
"r_x3": 308.86,
"r_y3": 317.47,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "balance in the previous datasets."
},
{
"label": "text",
"id": 2,
"page_no": 2,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 331.53,
"r": 545.12,
"b": 627.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 340.44,
"r_x1": 545.12,
"r_y1": 340.44,
"r_x2": 545.12,
"r_y2": 331.53,
"r_x3": 320.82,
"r_y3": 331.53,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.39,
"r_x1": 545.12,
"r_y1": 352.39,
"r_x2": 545.12,
"r_y2": 343.49,
"r_x3": 308.86,
"r_y3": 343.49,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.35,
"r_x1": 545.12,
"r_y1": 364.35,
"r_x2": 545.12,
"r_y2": 355.44,
"r_x3": 308.86,
"r_y3": 355.44,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 376.3,
"r_x1": 545.12,
"r_y1": 376.3,
"r_x2": 545.12,
"r_y2": 367.4,
"r_x3": 308.86,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.26,
"r_x1": 545.12,
"r_y1": 388.26,
"r_x2": 545.12,
"r_y2": 379.35,
"r_x3": 308.86,
"r_y3": 379.35,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.21,
"r_x1": 545.12,
"r_y1": 400.21,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 308.86,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.26,
"r_x3": 308.86,
"r_y3": 403.26,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.12,
"r_x1": 545.12,
"r_y1": 424.12,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.17,
"r_x3": 308.86,
"r_y3": 427.17,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.03,
"r_x1": 545.12,
"r_y1": 448.03,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 545.12,
"r_y1": 459.99,
"r_x2": 545.12,
"r_y2": 451.08,
"r_x3": 308.86,
"r_y3": 451.08,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 471.94,
"r_x1": 545.12,
"r_y1": 471.94,
"r_x2": 545.12,
"r_y2": 463.04,
"r_x3": 308.86,
"r_y3": 463.04,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 483.9,
"r_x1": 545.12,
"r_y1": 483.9,
"r_x2": 545.12,
"r_y2": 474.99,
"r_x3": 308.86,
"r_y3": 474.99,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 495.86,
"r_x1": 545.12,
"r_y1": 495.86,
"r_x2": 545.12,
"r_y2": 486.95,
"r_x3": 308.86,
"r_y3": 486.95,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 507.81,
"r_x1": 545.12,
"r_y1": 507.81,
"r_x2": 545.12,
"r_y2": 498.9,
"r_x3": 308.86,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 519.77,
"r_x1": 545.12,
"r_y1": 519.77,
"r_x2": 545.12,
"r_y2": 510.86,
"r_x3": 308.86,
"r_y3": 510.86,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 531.72,
"r_x1": 545.12,
"r_y1": 531.72,
"r_x2": 545.12,
"r_y2": 522.81,
"r_x3": 308.86,
"r_y3": 522.81,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 543.68,
"r_x1": 545.12,
"r_y1": 543.68,
"r_x2": 545.12,
"r_y2": 534.77,
"r_x3": 308.86,
"r_y3": 534.77,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.63,
"r_x1": 545.12,
"r_y1": 555.63,
"r_x2": 545.12,
"r_y2": 546.72,
"r_x3": 308.86,
"r_y3": 546.72,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.59,
"r_x1": 545.12,
"r_y1": 567.59,
"r_x2": 545.12,
"r_y2": 558.68,
"r_x3": 308.86,
"r_y3": 558.68,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 579.54,
"r_x1": 545.12,
"r_y1": 579.54,
"r_x2": 545.12,
"r_y2": 570.64,
"r_x3": 308.86,
"r_y3": 570.64,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 591.5,
"r_x1": 545.11,
"r_y1": 591.5,
"r_x2": 545.11,
"r_y2": 582.59,
"r_x3": 308.86,
"r_y3": 582.59,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 603.45,
"r_x1": 545.12,
"r_y1": 603.45,
"r_x2": 545.12,
"r_y2": 594.55,
"r_x3": 308.86,
"r_y3": 594.55,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 615.41,
"r_x1": 545.12,
"r_y1": 615.41,
"r_x2": 545.12,
"r_y2": 606.5,
"r_x3": 308.86,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 627.36,
"r_x1": 348.16,
"r_y1": 627.36,
"r_x2": 348.16,
"r_y2": 618.46,
"r_x3": 308.86,
"r_y3": 618.46,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."
},
{
"label": "text",
"id": 4,
"page_no": 2,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 632.51,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 641.42,
"r_x1": 545.11,
"r_y1": 641.42,
"r_x2": 545.11,
"r_y2": 632.51,
"r_x3": 320.82,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.42,
"r_x3": 308.86,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"
},
{
"label": "page_footer",
"id": 11,
"page_no": 2,
"cluster": {
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3"
}
],
"body": [
{
"label": "text",
"id": 10,
"page_no": 2,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 250.15,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 250.15,
"r_y1": 84.11,
"r_x2": 250.15,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tag-decoder which is constrained to the table-tags."
},
{
"label": "text",
"id": 5,
"page_no": 2,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.22,
"r": 286.37,
"b": 275.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.982,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.13,
"r_x1": 70.37,
"r_y1": 96.13,
"r_x2": 70.37,
"r_y2": 87.22,
"r_x3": 62.07,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.93,
"r_y0": 96.13,
"r_x1": 110.95,
"r_y1": 96.13,
"r_x2": 110.95,
"r_y2": 87.22,
"r_x3": 76.93,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.54,
"r_y0": 96.13,
"r_x1": 136.26,
"r_y1": 96.13,
"r_x2": 136.26,
"r_y2": 87.22,
"r_x3": 118.54,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.82,
"r_y0": 96.13,
"r_x1": 175.37,
"r_y1": 96.13,
"r_x2": 175.37,
"r_y2": 87.22,
"r_x3": 142.82,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.95,
"r_y0": 96.13,
"r_x1": 232.84,
"r_y1": 96.13,
"r_x2": 232.84,
"r_y2": 87.22,
"r_x3": 181.95,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.41,
"r_y0": 96.13,
"r_x1": 265.41,
"r_y1": 96.13,
"r_x2": 265.41,
"r_y2": 87.22,
"r_x3": 239.41,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 271.98,
"r_y0": 96.13,
"r_x1": 286.36,
"r_y1": 96.13,
"r_x2": 286.36,
"r_y2": 87.22,
"r_x3": 271.98,
"r_y3": 87.22,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.08,
"r_x1": 286.37,
"r_y1": 108.08,
"r_x2": 286.37,
"r_y2": 99.17,
"r_x3": 50.11,
"r_y3": 99.17,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 120.04,
"r_x1": 286.37,
"r_y1": 120.04,
"r_x2": 286.37,
"r_y2": 111.13,
"r_x3": 50.11,
"r_y3": 111.13,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.99,
"r_x1": 286.37,
"r_y1": 131.99,
"r_x2": 286.37,
"r_y2": 123.09,
"r_x3": 50.11,
"r_y3": 123.09,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.95,
"r_x1": 286.37,
"r_y1": 143.95,
"r_x2": 286.37,
"r_y2": 135.04,
"r_x3": 50.11,
"r_y3": 135.04,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.9,
"r_x1": 286.37,
"r_y1": 155.9,
"r_x2": 286.37,
"r_y2": 147.0,
"r_x3": 50.11,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 167.86,
"r_x1": 286.37,
"r_y1": 167.86,
"r_x2": 286.37,
"r_y2": 158.95,
"r_x3": 50.11,
"r_y3": 158.95,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 179.81,
"r_x1": 286.37,
"r_y1": 179.81,
"r_x2": 286.37,
"r_y2": 170.91,
"r_x3": 50.11,
"r_y3": 170.91,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 191.77,
"r_x1": 286.37,
"r_y1": 191.77,
"r_x2": 286.37,
"r_y2": 182.86,
"r_x3": 50.11,
"r_y3": 182.86,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 203.72,
"r_x1": 286.37,
"r_y1": 203.72,
"r_x2": 286.37,
"r_y2": 194.82,
"r_x3": 50.11,
"r_y3": 194.82,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 215.68,
"r_x1": 286.37,
"r_y1": 215.68,
"r_x2": 286.37,
"r_y2": 206.77,
"r_x3": 50.11,
"r_y3": 206.77,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 227.63,
"r_x1": 286.37,
"r_y1": 227.63,
"r_x2": 286.37,
"r_y2": 218.73,
"r_x3": 50.11,
"r_y3": 218.73,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 239.59,
"r_x1": 286.37,
"r_y1": 239.59,
"r_x2": 286.37,
"r_y2": 230.68,
"r_x3": 50.11,
"r_y3": 230.68,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 251.54,
"r_x1": 286.37,
"r_y1": 251.54,
"r_x2": 286.37,
"r_y2": 242.64,
"r_x3": 50.11,
"r_y3": 242.64,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 263.5,
"r_x1": 286.37,
"r_y1": 263.5,
"r_x2": 286.37,
"r_y2": 254.59,
"r_x3": 50.11,
"r_y3": 254.59,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 275.45,
"r_x1": 64.78,
"r_y1": 275.45,
"r_x2": 64.78,
"r_y2": 266.55,
"r_x3": 50.11,
"r_y3": 266.55,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-character-recognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."
},
{
"label": "text",
"id": 0,
"page_no": 2,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 278.44,
"r": 286.37,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 287.4,
"r_x1": 171.57,
"r_y1": 287.4,
"r_x2": 171.57,
"r_y2": 278.44,
"r_x3": 62.07,
"r_y3": 278.44,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.57,
"r_y0": 287.47,
"r_x1": 174.34,
"r_y1": 287.47,
"r_x2": 174.34,
"r_y2": 278.56,
"r_x3": 171.57,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.19,
"r_y0": 287.47,
"r_x1": 286.36,
"r_y1": 287.47,
"r_x2": 286.36,
"r_y2": 278.56,
"r_x3": 185.19,
"r_y3": 278.56,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 299.42,
"r_x1": 286.37,
"r_y1": 299.42,
"r_x2": 286.37,
"r_y2": 290.51,
"r_x3": 50.11,
"r_y3": 290.51,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 311.38,
"r_x1": 131.17,
"r_y1": 311.38,
"r_x2": 131.17,
"r_y2": 302.47,
"r_x3": 50.11,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.85,
"r_y0": 311.38,
"r_x1": 286.37,
"r_y1": 311.38,
"r_x2": 286.37,
"r_y2": 302.47,
"r_x3": 138.85,
"r_y3": 302.47,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.33,
"r_x1": 286.37,
"r_y1": 323.33,
"r_x2": 286.37,
"r_y2": 314.42,
"r_x3": 50.11,
"r_y3": 314.42,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.29,
"r_x1": 286.37,
"r_y1": 335.29,
"r_x2": 286.37,
"r_y2": 326.38,
"r_x3": 50.11,
"r_y3": 326.38,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.24,
"r_x1": 286.37,
"r_y1": 347.24,
"r_x2": 286.37,
"r_y2": 338.33,
"r_x3": 50.11,
"r_y3": 338.33,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.2,
"r_x1": 286.37,
"r_y1": 359.2,
"r_x2": 286.37,
"r_y2": 350.29,
"r_x3": 50.11,
"r_y3": 350.29,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.15,
"r_x1": 286.37,
"r_y1": 371.15,
"r_x2": 286.37,
"r_y2": 362.25,
"r_x3": 50.11,
"r_y3": 362.25,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.11,
"r_x1": 286.37,
"r_y1": 383.11,
"r_x2": 286.37,
"r_y2": 374.2,
"r_x3": 50.11,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.06,
"r_x1": 286.37,
"r_y1": 395.06,
"r_x2": 286.37,
"r_y2": 386.16,
"r_x3": 50.11,
"r_y3": 386.16,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 407.02,
"r_x1": 286.37,
"r_y1": 407.02,
"r_x2": 286.37,
"r_y2": 398.11,
"r_x3": 50.11,
"r_y3": 398.11,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 418.97,
"r_x1": 286.37,
"r_y1": 418.97,
"r_x2": 286.37,
"r_y2": 410.07,
"r_x3": 50.11,
"r_y3": 410.07,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 430.93,
"r_x1": 286.37,
"r_y1": 430.93,
"r_x2": 286.37,
"r_y2": 422.02,
"r_x3": 50.11,
"r_y3": 422.02,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 442.88,
"r_x1": 198.24,
"r_y1": 442.88,
"r_x2": 198.24,
"r_y2": 433.98,
"r_x3": 50.11,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.93,
"r_y0": 442.88,
"r_x1": 286.37,
"r_y1": 442.88,
"r_x2": 286.37,
"r_y2": 433.98,
"r_x3": 205.93,
"r_y3": 433.98,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 454.84,
"r_x1": 286.37,
"r_y1": 454.84,
"r_x2": 286.37,
"r_y2": 445.93,
"r_x3": 50.11,
"r_y3": 445.93,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 466.79,
"r_x1": 286.37,
"r_y1": 466.79,
"r_x2": 286.37,
"r_y2": 457.89,
"r_x3": 50.11,
"r_y3": 457.89,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 478.75,
"r_x1": 286.37,
"r_y1": 478.75,
"r_x2": 286.37,
"r_y2": 469.84,
"r_x3": 50.11,
"r_y3": 469.84,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.11,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to table-structure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."
},
{
"label": "text",
"id": 1,
"page_no": 2,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 493.69,
"r": 286.37,
"b": 622.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 502.65,
"r_x1": 252.88,
"r_y1": 502.65,
"r_x2": 252.88,
"r_y2": 493.69,
"r_x3": 62.07,
"r_y3": 493.69,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.88,
"r_y0": 502.71,
"r_x1": 286.37,
"r_y1": 502.71,
"r_x2": 286.37,
"r_y2": 493.81,
"r_x3": 252.88,
"r_y3": 493.81,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.67,
"r_x1": 286.37,
"r_y1": 514.67,
"r_x2": 286.37,
"r_y2": 505.76,
"r_x3": 50.11,
"r_y3": 505.76,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 526.62,
"r_x1": 286.37,
"r_y1": 526.62,
"r_x2": 286.37,
"r_y2": 517.72,
"r_x3": 50.11,
"r_y3": 517.72,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 538.58,
"r_x1": 286.37,
"r_y1": 538.58,
"r_x2": 286.37,
"r_y2": 529.67,
"r_x3": 50.11,
"r_y3": 529.67,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 550.54,
"r_x1": 286.37,
"r_y1": 550.54,
"r_x2": 286.37,
"r_y2": 541.63,
"r_x3": 50.11,
"r_y3": 541.63,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 562.49,
"r_x1": 286.37,
"r_y1": 562.49,
"r_x2": 286.37,
"r_y2": 553.58,
"r_x3": 50.11,
"r_y3": 553.58,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 574.45,
"r_x1": 286.37,
"r_y1": 574.45,
"r_x2": 286.37,
"r_y2": 565.54,
"r_x3": 50.11,
"r_y3": 565.54,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.4,
"r_x1": 286.37,
"r_y1": 586.4,
"r_x2": 286.37,
"r_y2": 577.49,
"r_x3": 50.11,
"r_y3": 577.49,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 598.36,
"r_x1": 286.37,
"r_y1": 598.36,
"r_x2": 286.37,
"r_y2": 589.45,
"r_x3": 50.11,
"r_y3": 589.45,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 610.31,
"r_x1": 286.37,
"r_y1": 610.31,
"r_x2": 286.37,
"r_y2": 601.4,
"r_x3": 50.11,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 622.27,
"r_x1": 175.99,
"r_y1": 622.27,
"r_x2": 175.99,
"r_y2": 613.36,
"r_x3": 50.11,
"r_y3": 613.36,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or Mask-RCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves state-of-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."
},
{
"label": "section_header",
"id": 8,
"page_no": 2,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 635.94,
"r": 105.23,
"b": 646.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.69,
"r_x1": 57.82,
"r_y1": 646.69,
"r_x2": 57.82,
"r_y2": 635.94,
"r_x3": 50.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.11,
"r_y0": 646.69,
"r_x1": 105.23,
"r_y1": 646.69,
"r_x2": 105.23,
"r_y2": 635.94,
"r_x3": 68.11,
"r_y3": 635.94,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Datasets"
},
{
"label": "text",
"id": 3,
"page_no": 2,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 656.43,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 665.33,
"r_x1": 286.36,
"r_y1": 665.33,
"r_x2": 286.36,
"r_y2": 656.43,
"r_x3": 62.07,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 166.25,
"r_y1": 701.2,
"r_x2": 166.25,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.69,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 173.69,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"
},
{
"label": "picture",
"id": 6,
"page_no": 2,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.44,
"r": 550.39,
"b": 250.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.975,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.81,
"r": 486.85,
"b": 88.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.569,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.56,
"r_x1": 486.85,
"r_y1": 88.56,
"r_x2": 486.85,
"r_y2": 79.81,
"r_x3": 380.8,
"r_y3": 79.81,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.77,
"t": 242.03,
"r": 469.79,
"b": 250.77,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.77,
"r_y0": 250.77,
"r_x1": 469.79,
"r_y1": 250.77,
"r_x2": 469.79,
"r_y2": 242.03,
"r_x3": 396.77,
"r_y3": 242.03,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 320.98,
"t": 233.42,
"r": 324.79,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.98,
"r_y0": 239.25,
"r_x1": 324.79,
"r_y1": 239.25,
"r_x2": 324.79,
"r_y2": 233.42,
"r_x3": 320.98,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.48,
"t": 233.42,
"r": 418.11,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.48,
"r_y0": 239.25,
"r_x1": 418.11,
"r_y1": 239.25,
"r_x2": 418.11,
"r_y2": 233.42,
"r_x3": 410.48,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.85,
"t": 233.42,
"r": 508.48,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.85,
"r_y0": 239.25,
"r_x1": 508.48,
"r_y1": 239.25,
"r_x2": 508.48,
"r_y2": 233.42,
"r_x3": 500.85,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.42,
"r": 372.93,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.25,
"r_x1": 372.93,
"r_y1": 239.25,
"r_x2": 372.93,
"r_y2": 233.42,
"r_x3": 365.3,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.67,
"t": 233.42,
"r": 463.3,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.67,
"r_y0": 239.25,
"r_x1": 463.3,
"r_y1": 239.25,
"r_x2": 463.3,
"r_y2": 233.42,
"r_x3": 455.67,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.04,
"t": 233.42,
"r": 549.67,
"b": 239.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.04,
"r_y0": 239.25,
"r_x1": 549.67,
"r_y1": 239.25,
"r_x2": 549.67,
"r_y2": 233.42,
"r_x3": 542.04,
"r_y3": 233.42,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.04,
"t": 230.45,
"r": 319.86,
"b": 236.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.04,
"r_y0": 236.28,
"r_x1": 319.86,
"r_y1": 236.28,
"r_x2": 319.86,
"r_y2": 230.45,
"r_x3": 316.04,
"r_y3": 230.45,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.63,
"t": 198.69,
"r": 316.44,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.63,
"r_y0": 204.52,
"r_x1": 316.44,
"r_y1": 204.52,
"r_x2": 316.44,
"r_y2": 198.69,
"r_x3": 312.63,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.44,
"t": 198.69,
"r": 320.26,
"b": 204.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.44,
"r_y0": 204.52,
"r_x1": 320.26,
"r_y1": 204.52,
"r_x2": 320.26,
"r_y2": 198.69,
"r_x3": 316.44,
"r_y3": 198.69,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.15,
"t": 168.1,
"r": 316.97,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.15,
"r_y0": 173.93,
"r_x1": 316.97,
"r_y1": 173.93,
"r_x2": 316.97,
"r_y2": 168.1,
"r_x3": 313.15,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 316.96,
"t": 168.1,
"r": 320.78,
"b": 173.93,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.96,
"r_y0": 173.93,
"r_x1": 320.78,
"r_y1": 173.93,
"r_x2": 320.78,
"r_y2": 168.1,
"r_x3": 316.96,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.93,
"t": 136.59,
"r": 316.75,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.93,
"r_y0": 142.42,
"r_x1": 316.75,
"r_y1": 142.42,
"r_x2": 316.75,
"r_y2": 136.59,
"r_x3": 312.93,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.74,
"t": 136.59,
"r": 320.56,
"b": 142.42,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.74,
"r_y0": 142.42,
"r_x1": 320.56,
"r_y1": 142.42,
"r_x2": 320.56,
"r_y2": 136.59,
"r_x3": 316.74,
"r_y3": 136.59,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.48,
"t": 105.6,
"r": 316.3,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 111.43,
"r_x1": 316.3,
"r_y1": 111.43,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.48,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.11,
"b": 111.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.43,
"r_x1": 320.11,
"r_y1": 111.43,
"r_x2": 320.11,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.48,
"t": 212.26,
"r": 316.3,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.48,
"r_y0": 218.09,
"r_x1": 316.3,
"r_y1": 218.09,
"r_x2": 316.3,
"r_y2": 212.26,
"r_x3": 312.48,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.26,
"r": 320.11,
"b": 218.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.09,
"r_x1": 320.11,
"r_y1": 218.09,
"r_x2": 320.11,
"r_y2": 212.26,
"r_x3": 316.3,
"r_y3": 212.26,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.08,
"t": 183.72,
"r": 316.89,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.08,
"r_y0": 189.55,
"r_x1": 316.89,
"r_y1": 189.55,
"r_x2": 316.89,
"r_y2": 183.72,
"r_x3": 313.08,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.89,
"t": 183.72,
"r": 320.71,
"b": 189.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.89,
"r_y0": 189.55,
"r_x1": 320.71,
"r_y1": 189.55,
"r_x2": 320.71,
"r_y2": 183.72,
"r_x3": 316.89,
"r_y3": 183.72,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.76,
"t": 152.47,
"r": 316.58,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.76,
"r_y0": 158.31,
"r_x1": 316.58,
"r_y1": 158.31,
"r_x2": 316.58,
"r_y2": 152.47,
"r_x3": 312.76,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.58,
"t": 152.47,
"r": 320.39,
"b": 158.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.58,
"r_y0": 158.31,
"r_x1": 320.39,
"r_y1": 158.31,
"r_x2": 320.39,
"r_y2": 152.47,
"r_x3": 316.58,
"r_y3": 152.47,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.57,
"r": 316.01,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.01,
"r_y1": 126.4,
"r_x2": 316.01,
"r_y2": 120.57,
"r_x3": 312.2,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.01,
"t": 120.57,
"r": 319.83,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.01,
"r_y0": 126.4,
"r_x1": 319.83,
"r_y1": 126.4,
"r_x2": 319.83,
"r_y2": 120.57,
"r_x3": 316.01,
"r_y3": 120.57,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.82,
"t": 90.11,
"r": 316.63,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.82,
"r_y0": 95.94,
"r_x1": 316.63,
"r_y1": 95.94,
"r_x2": 316.63,
"r_y2": 90.11,
"r_x3": 312.82,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.63,
"t": 90.11,
"r": 320.45,
"b": 95.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.63,
"r_y0": 95.94,
"r_x1": 320.45,
"r_y1": 95.94,
"r_x2": 320.45,
"r_y2": 90.11,
"r_x3": 316.63,
"r_y3": 90.11,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.17,
"t": 222.73,
"r": 536.94,
"b": 230.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.17,
"r_y0": 230.02,
"r_x1": 536.94,
"r_y1": 230.02,
"r_x2": 536.94,
"r_y2": 222.73,
"r_x3": 532.17,
"r_y3": 222.73,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.88,
"t": 108.27,
"r": 547.61,
"b": 115.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.88,
"r_y0": 115.56,
"r_x1": 547.61,
"r_y1": 115.56,
"r_x2": 547.61,
"r_y2": 108.27,
"r_x3": 532.88,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.77,
"t": 130.78,
"r": 542.74,
"b": 138.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.77,
"r_y0": 138.07,
"r_x1": 542.74,
"r_y1": 138.07,
"r_x2": 542.74,
"r_y2": 130.78,
"r_x3": 532.77,
"r_y3": 130.78,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.92,
"r": 542.76,
"b": 161.21,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.21,
"r_x1": 542.76,
"r_y1": 161.21,
"r_x2": 542.76,
"r_y2": 153.92,
"r_x3": 532.8,
"r_y3": 153.92,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.57,
"t": 176.76,
"r": 542.54,
"b": 184.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.57,
"r_y0": 184.05,
"r_x1": 542.54,
"r_y1": 184.05,
"r_x2": 542.54,
"r_y2": 176.76,
"r_x3": 532.57,
"r_y3": 176.76,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.15,
"t": 199.65,
"r": 542.11,
"b": 206.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.15,
"r_y0": 206.94,
"r_x1": 542.11,
"r_y1": 206.94,
"r_x2": 542.11,
"r_y2": 199.65,
"r_x3": 532.15,
"r_y3": 199.65,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 7,
"page_no": 2,
"cluster": {
"id": 7,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 267.84,
"r": 545.12,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 276.74,
"r_x1": 346.06,
"r_y1": 276.74,
"r_x2": 346.06,
"r_y2": 267.84,
"r_x3": 308.86,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.49,
"r_y0": 276.74,
"r_x1": 545.12,
"r_y1": 276.74,
"r_x2": 545.12,
"r_y2": 267.84,
"r_x3": 354.49,
"r_y3": 267.84,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 288.7,
"r_x1": 498.57,
"r_y1": 288.7,
"r_x2": 498.57,
"r_y2": 279.79,
"r_x3": 308.86,
"r_y3": 279.79,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"
},
{
"label": "text",
"id": 9,
"page_no": 2,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 317.47,
"r": 437.27,
"b": 326.38,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 326.38,
"r_x1": 437.27,
"r_y1": 326.38,
"r_x2": 437.27,
"r_y2": 317.47,
"r_x3": 308.86,
"r_y3": 317.47,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "balance in the previous datasets."
},
{
"label": "text",
"id": 2,
"page_no": 2,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 331.53,
"r": 545.12,
"b": 627.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 340.44,
"r_x1": 545.12,
"r_y1": 340.44,
"r_x2": 545.12,
"r_y2": 331.53,
"r_x3": 320.82,
"r_y3": 331.53,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.39,
"r_x1": 545.12,
"r_y1": 352.39,
"r_x2": 545.12,
"r_y2": 343.49,
"r_x3": 308.86,
"r_y3": 343.49,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.35,
"r_x1": 545.12,
"r_y1": 364.35,
"r_x2": 545.12,
"r_y2": 355.44,
"r_x3": 308.86,
"r_y3": 355.44,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 376.3,
"r_x1": 545.12,
"r_y1": 376.3,
"r_x2": 545.12,
"r_y2": 367.4,
"r_x3": 308.86,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.26,
"r_x1": 545.12,
"r_y1": 388.26,
"r_x2": 545.12,
"r_y2": 379.35,
"r_x3": 308.86,
"r_y3": 379.35,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.21,
"r_x1": 545.12,
"r_y1": 400.21,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 308.86,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.26,
"r_x3": 308.86,
"r_y3": 403.26,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.12,
"r_x1": 545.12,
"r_y1": 424.12,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.17,
"r_x3": 308.86,
"r_y3": 427.17,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.03,
"r_x1": 545.12,
"r_y1": 448.03,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 545.12,
"r_y1": 459.99,
"r_x2": 545.12,
"r_y2": 451.08,
"r_x3": 308.86,
"r_y3": 451.08,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 471.94,
"r_x1": 545.12,
"r_y1": 471.94,
"r_x2": 545.12,
"r_y2": 463.04,
"r_x3": 308.86,
"r_y3": 463.04,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 483.9,
"r_x1": 545.12,
"r_y1": 483.9,
"r_x2": 545.12,
"r_y2": 474.99,
"r_x3": 308.86,
"r_y3": 474.99,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 495.86,
"r_x1": 545.12,
"r_y1": 495.86,
"r_x2": 545.12,
"r_y2": 486.95,
"r_x3": 308.86,
"r_y3": 486.95,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 507.81,
"r_x1": 545.12,
"r_y1": 507.81,
"r_x2": 545.12,
"r_y2": 498.9,
"r_x3": 308.86,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 519.77,
"r_x1": 545.12,
"r_y1": 519.77,
"r_x2": 545.12,
"r_y2": 510.86,
"r_x3": 308.86,
"r_y3": 510.86,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 531.72,
"r_x1": 545.12,
"r_y1": 531.72,
"r_x2": 545.12,
"r_y2": 522.81,
"r_x3": 308.86,
"r_y3": 522.81,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 543.68,
"r_x1": 545.12,
"r_y1": 543.68,
"r_x2": 545.12,
"r_y2": 534.77,
"r_x3": 308.86,
"r_y3": 534.77,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.63,
"r_x1": 545.12,
"r_y1": 555.63,
"r_x2": 545.12,
"r_y2": 546.72,
"r_x3": 308.86,
"r_y3": 546.72,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.59,
"r_x1": 545.12,
"r_y1": 567.59,
"r_x2": 545.12,
"r_y2": 558.68,
"r_x3": 308.86,
"r_y3": 558.68,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 579.54,
"r_x1": 545.12,
"r_y1": 579.54,
"r_x2": 545.12,
"r_y2": 570.64,
"r_x3": 308.86,
"r_y3": 570.64,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 591.5,
"r_x1": 545.11,
"r_y1": 591.5,
"r_x2": 545.11,
"r_y2": 582.59,
"r_x3": 308.86,
"r_y3": 582.59,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 603.45,
"r_x1": 545.12,
"r_y1": 603.45,
"r_x2": 545.12,
"r_y2": 594.55,
"r_x3": 308.86,
"r_y3": 594.55,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 615.41,
"r_x1": 545.12,
"r_y1": 615.41,
"r_x2": 545.12,
"r_y2": 606.5,
"r_x3": 308.86,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 627.36,
"r_x1": 348.16,
"r_y1": 627.36,
"r_x2": 348.16,
"r_y2": 618.46,
"r_x3": 308.86,
"r_y3": 618.46,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."
},
{
"label": "text",
"id": 4,
"page_no": 2,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 632.51,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 641.42,
"r_x1": 545.11,
"r_y1": 641.42,
"r_x2": 545.11,
"r_y2": 632.51,
"r_x3": 320.82,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.38,
"r_x1": 545.12,
"r_y1": 653.38,
"r_x2": 545.12,
"r_y2": 644.47,
"r_x3": 308.86,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.33,
"r_x1": 545.12,
"r_y1": 665.33,
"r_x2": 545.12,
"r_y2": 656.42,
"r_x3": 308.86,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"
}
],
"headers": [
{
"label": "page_footer",
"id": 11,
"page_no": 2,
"cluster": {
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3"
}
]
}
},
{
"page_no": 3,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 212.28,
"r_y1": 96.07,
"r_x2": 212.28,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 109.87,
"r_x1": 286.37,
"r_y1": 109.87,
"r_x2": 286.37,
"r_y2": 100.96,
"r_x3": 62.07,
"r_y3": 100.96,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 121.82,
"r_x1": 286.37,
"r_y1": 121.82,
"r_x2": 286.37,
"r_y2": 112.92,
"r_x3": 50.11,
"r_y3": 112.92,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 133.78,
"r_x1": 286.37,
"r_y1": 133.78,
"r_x2": 286.37,
"r_y2": 124.87,
"r_x3": 50.11,
"r_y3": 124.87,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 145.73,
"r_x1": 286.37,
"r_y1": 145.73,
"r_x2": 286.37,
"r_y2": 136.83,
"r_x3": 50.11,
"r_y3": 136.83,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 157.69,
"r_x1": 286.37,
"r_y1": 157.69,
"r_x2": 286.37,
"r_y2": 148.78,
"r_x3": 50.11,
"r_y3": 148.78,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 169.64,
"r_x1": 286.37,
"r_y1": 169.64,
"r_x2": 286.37,
"r_y2": 160.74,
"r_x3": 50.11,
"r_y3": 160.74,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 181.6,
"r_x1": 286.37,
"r_y1": 181.6,
"r_x2": 286.37,
"r_y2": 172.69,
"r_x3": 50.11,
"r_y3": 172.69,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 193.55,
"r_x1": 286.37,
"r_y1": 193.55,
"r_x2": 286.37,
"r_y2": 184.65,
"r_x3": 50.11,
"r_y3": 184.65,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 205.51,
"r_x1": 286.37,
"r_y1": 205.51,
"r_x2": 286.37,
"r_y2": 196.6,
"r_x3": 50.11,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 217.46,
"r_x1": 286.37,
"r_y1": 217.46,
"r_x2": 286.37,
"r_y2": 208.56,
"r_x3": 50.11,
"r_y3": 208.56,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 229.42,
"r_x1": 286.37,
"r_y1": 229.42,
"r_x2": 286.37,
"r_y2": 220.51,
"r_x3": 50.11,
"r_y3": 220.51,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 241.37,
"r_x1": 286.37,
"r_y1": 241.37,
"r_x2": 286.37,
"r_y2": 232.47,
"r_x3": 50.11,
"r_y3": 232.47,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 253.33,
"r_x1": 286.37,
"r_y1": 253.33,
"r_x2": 286.37,
"r_y2": 244.42,
"r_x3": 50.11,
"r_y3": 244.42,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 265.28,
"r_x1": 286.37,
"r_y1": 265.28,
"r_x2": 286.37,
"r_y2": 256.38,
"r_x3": 50.11,
"r_y3": 256.38,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 277.24,
"r_x1": 286.37,
"r_y1": 277.24,
"r_x2": 286.37,
"r_y2": 268.33,
"r_x3": 50.11,
"r_y3": 268.33,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 289.2,
"r_x1": 68.65,
"r_y1": 289.2,
"r_x2": 68.65,
"r_y2": 280.29,
"r_x3": 50.11,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.57,
"r_y0": 289.2,
"r_x1": 286.37,
"r_y1": 289.2,
"r_x2": 286.37,
"r_y2": 280.29,
"r_x3": 75.57,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 301.15,
"r_x1": 286.37,
"r_y1": 301.15,
"r_x2": 286.37,
"r_y2": 292.24,
"r_x3": 50.11,
"r_y3": 292.24,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 313.11,
"r_x1": 75.7,
"r_y1": 313.11,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.11,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 326.9,
"r_x1": 286.36,
"r_y1": 326.9,
"r_x2": 286.36,
"r_y2": 318.0,
"r_x3": 62.07,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 338.86,
"r_x1": 286.37,
"r_y1": 338.86,
"r_x2": 286.37,
"r_y2": 329.95,
"r_x3": 50.11,
"r_y3": 329.95,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 350.81,
"r_x1": 286.37,
"r_y1": 350.81,
"r_x2": 286.37,
"r_y2": 341.91,
"r_x3": 50.11,
"r_y3": 341.91,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 362.77,
"r_x1": 286.37,
"r_y1": 362.77,
"r_x2": 286.37,
"r_y2": 353.86,
"r_x3": 50.11,
"r_y3": 353.86,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 374.72,
"r_x1": 286.37,
"r_y1": 374.72,
"r_x2": 286.37,
"r_y2": 365.82,
"r_x3": 50.11,
"r_y3": 365.82,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 386.68,
"r_x1": 141.59,
"r_y1": 386.68,
"r_x2": 141.59,
"r_y2": 377.77,
"r_x3": 50.11,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.68,
"r_x1": 286.37,
"r_y1": 386.68,
"r_x2": 286.37,
"r_y2": 377.77,
"r_x3": 148.7,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 398.63,
"r_x1": 286.37,
"r_y1": 398.63,
"r_x2": 286.37,
"r_y2": 389.73,
"r_x3": 50.11,
"r_y3": 389.73,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 410.59,
"r_x1": 286.37,
"r_y1": 410.59,
"r_x2": 286.37,
"r_y2": 401.68,
"r_x3": 50.11,
"r_y3": 401.68,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 422.54,
"r_x1": 286.37,
"r_y1": 422.54,
"r_x2": 286.37,
"r_y2": 413.64,
"r_x3": 50.11,
"r_y3": 413.64,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.59,
"r_x3": 50.11,
"r_y3": 425.59,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 448.3,
"r_x1": 286.36,
"r_y1": 448.3,
"r_x2": 286.36,
"r_y2": 439.39,
"r_x3": 62.07,
"r_y3": 439.39,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.25,
"r_x1": 172.14,
"r_y1": 460.25,
"r_x2": 172.14,
"r_y2": 451.34,
"r_x3": 50.11,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.15,
"r_y0": 460.02,
"r_x1": 224.71,
"r_y1": 460.02,
"r_x2": 224.71,
"r_y2": 451.43,
"r_x3": 174.15,
"r_y3": 451.43,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.71,
"r_y0": 460.25,
"r_x1": 286.37,
"r_y1": 460.25,
"r_x2": 286.37,
"r_y2": 451.34,
"r_x3": 224.71,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.21,
"r_x1": 286.37,
"r_y1": 472.21,
"r_x2": 286.37,
"r_y2": 463.3,
"r_x3": 50.11,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.16,
"r_x1": 286.37,
"r_y1": 484.16,
"r_x2": 286.37,
"r_y2": 475.26,
"r_x3": 50.11,
"r_y3": 475.26,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 496.12,
"r_x1": 286.37,
"r_y1": 496.12,
"r_x2": 286.37,
"r_y2": 487.21,
"r_x3": 50.11,
"r_y3": 487.21,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 508.07,
"r_x1": 286.37,
"r_y1": 508.07,
"r_x2": 286.37,
"r_y2": 499.17,
"r_x3": 50.11,
"r_y3": 499.17,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 520.03,
"r_x1": 286.37,
"r_y1": 520.03,
"r_x2": 286.37,
"r_y2": 511.12,
"r_x3": 50.11,
"r_y3": 511.12,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.98,
"r_x1": 286.37,
"r_y1": 531.98,
"r_x2": 286.37,
"r_y2": 523.08,
"r_x3": 50.11,
"r_y3": 523.08,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.94,
"r_x1": 286.37,
"r_y1": 543.94,
"r_x2": 286.37,
"r_y2": 535.03,
"r_x3": 50.11,
"r_y3": 535.03,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.89,
"r_x1": 286.37,
"r_y1": 555.89,
"r_x2": 286.37,
"r_y2": 546.99,
"r_x3": 50.11,
"r_y3": 546.99,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.85,
"r_x1": 286.37,
"r_y1": 567.85,
"r_x2": 286.37,
"r_y2": 558.94,
"r_x3": 50.11,
"r_y3": 558.94,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.8,
"r_x1": 286.37,
"r_y1": 579.8,
"r_x2": 286.37,
"r_y2": 570.9,
"r_x3": 50.11,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.76,
"r_x1": 286.37,
"r_y1": 591.76,
"r_x2": 286.37,
"r_y2": 582.85,
"r_x3": 50.11,
"r_y3": 582.85,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.71,
"r_x1": 286.37,
"r_y1": 603.71,
"r_x2": 286.37,
"r_y2": 594.81,
"r_x3": 50.11,
"r_y3": 594.81,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.67,
"r_x1": 286.37,
"r_y1": 615.67,
"r_x2": 286.37,
"r_y2": 606.76,
"r_x3": 50.11,
"r_y3": 606.76,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.62,
"r_x1": 209.75,
"r_y1": 627.62,
"r_x2": 209.75,
"r_y2": 618.72,
"r_x3": 50.11,
"r_y3": 618.72,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 641.42,
"r_x1": 286.36,
"r_y1": 641.42,
"r_x2": 286.36,
"r_y2": 632.51,
"r_x3": 62.07,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.43,
"r_x3": 50.11,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 176.57,
"r_x1": 344.62,
"r_y1": 176.57,
"r_x2": 344.62,
"r_y2": 167.66,
"r_x3": 308.86,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.08,
"r_y0": 176.57,
"r_x1": 380.45,
"r_y1": 176.57,
"r_x2": 380.45,
"r_y2": 167.66,
"r_x3": 361.08,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.57,
"r_y0": 176.34,
"r_x1": 468.68,
"r_y1": 176.34,
"r_x2": 468.68,
"r_y2": 167.75,
"r_x3": 386.57,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.57,
"r_x1": 489.18,
"r_y1": 176.57,
"r_x2": 489.18,
"r_y2": 167.66,
"r_x3": 474.8,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.34,
"r_x1": 545.11,
"r_y1": 176.34,
"r_x2": 545.11,
"r_y2": 167.75,
"r_x3": 495.3,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 188.29,
"r_x1": 341.16,
"r_y1": 188.29,
"r_x2": 341.16,
"r_y2": 179.71,
"r_x3": 308.86,
"r_y3": 179.71,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.46,
"r_y0": 188.52,
"r_x1": 545.11,
"r_y1": 188.52,
"r_x2": 545.11,
"r_y2": 179.62,
"r_x3": 343.46,
"r_y3": 179.62,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 200.48,
"r_x1": 545.12,
"r_y1": 200.48,
"r_x2": 545.12,
"r_y2": 191.57,
"r_x3": 308.86,
"r_y3": 191.57,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 212.43,
"r_x1": 545.11,
"r_y1": 212.43,
"r_x2": 545.11,
"r_y2": 203.53,
"r_x3": 308.86,
"r_y3": 203.53,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 224.39,
"r_x1": 523.93,
"r_y1": 224.39,
"r_x2": 523.93,
"r_y2": 215.48,
"r_x3": 308.86,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.53,
"r_x1": 545.12,
"r_y1": 258.53,
"r_x2": 545.12,
"r_y2": 249.62,
"r_x3": 308.86,
"r_y3": 249.62,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.48,
"r_x1": 545.12,
"r_y1": 270.48,
"r_x2": 545.12,
"r_y2": 261.58,
"r_x3": 308.86,
"r_y3": 261.58,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.44,
"r_x1": 545.12,
"r_y1": 282.44,
"r_x2": 545.12,
"r_y2": 273.53,
"r_x3": 308.86,
"r_y3": 273.53,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.39,
"r_x1": 436.82,
"r_y1": 294.39,
"r_x2": 436.82,
"r_y2": 285.49,
"r_x3": 308.86,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 306.68,
"r_x1": 542.74,
"r_y1": 306.68,
"r_x2": 542.74,
"r_y2": 297.77,
"r_x3": 320.82,
"r_y3": 297.77,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 331.93,
"r_x1": 316.28,
"r_y1": 331.93,
"r_x2": 316.28,
"r_y2": 321.18,
"r_x3": 308.86,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.18,
"r_y0": 331.93,
"r_x1": 444.94,
"r_y1": 331.93,
"r_x2": 444.94,
"r_y2": 321.18,
"r_x3": 326.18,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 350.85,
"r_x1": 545.11,
"r_y1": 350.85,
"r_x2": 545.11,
"r_y2": 341.94,
"r_x3": 320.82,
"r_y3": 341.94,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 362.8,
"r_x1": 545.12,
"r_y1": 362.8,
"r_x2": 545.12,
"r_y2": 353.89,
"r_x3": 308.86,
"r_y3": 353.89,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 374.76,
"r_x1": 545.12,
"r_y1": 374.76,
"r_x2": 545.12,
"r_y2": 365.85,
"r_x3": 308.86,
"r_y3": 365.85,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 386.71,
"r_x1": 545.12,
"r_y1": 386.71,
"r_x2": 545.12,
"r_y2": 377.8,
"r_x3": 308.86,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 398.67,
"r_x1": 545.12,
"r_y1": 398.67,
"r_x2": 545.12,
"r_y2": 389.76,
"r_x3": 308.86,
"r_y3": 389.76,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 410.62,
"r_x1": 545.12,
"r_y1": 410.62,
"r_x2": 545.12,
"r_y2": 401.71,
"r_x3": 308.86,
"r_y3": 401.71,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 422.58,
"r_x1": 545.12,
"r_y1": 422.58,
"r_x2": 545.12,
"r_y2": 413.67,
"r_x3": 308.86,
"r_y3": 413.67,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 434.53,
"r_x1": 545.12,
"r_y1": 434.53,
"r_x2": 545.12,
"r_y2": 425.63,
"r_x3": 308.86,
"r_y3": 425.63,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 446.49,
"r_x1": 437.94,
"r_y1": 446.49,
"r_x2": 437.94,
"r_y2": 437.58,
"r_x3": 308.86,
"r_y3": 437.58,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 467.55,
"r_x1": 323.14,
"r_y1": 467.55,
"r_x2": 323.14,
"r_y2": 457.69,
"r_x3": 308.86,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.66,
"r_y0": 467.55,
"r_x1": 420.16,
"r_y1": 467.55,
"r_x2": 420.16,
"r_y2": 457.69,
"r_x3": 332.66,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 485.67,
"r_x1": 545.11,
"r_y1": 485.67,
"r_x2": 545.11,
"r_y2": 476.77,
"r_x3": 320.82,
"r_y3": 476.77,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.63,
"r_x1": 509.02,
"r_y1": 497.63,
"r_x2": 509.02,
"r_y2": 488.72,
"r_x3": 308.86,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.59,
"r_y0": 497.63,
"r_x1": 523.06,
"r_y1": 497.63,
"r_x2": 523.06,
"r_y2": 488.72,
"r_x3": 515.59,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 497.63,
"r_x1": 545.12,
"r_y1": 497.63,
"r_x2": 545.12,
"r_y2": 488.72,
"r_x3": 529.62,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.35,
"r_x1": 406.35,
"r_y1": 509.35,
"r_x2": 406.35,
"r_y2": 500.76,
"r_x3": 308.86,
"r_y3": 500.76,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.87,
"r_y0": 509.58,
"r_x1": 545.11,
"r_y1": 509.58,
"r_x2": 545.11,
"r_y2": 500.68,
"r_x3": 408.87,
"r_y3": 500.68,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.54,
"r_x1": 409.39,
"r_y1": 521.54,
"r_x2": 409.39,
"r_y2": 512.63,
"r_x3": 308.86,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.73,
"r_y0": 521.54,
"r_x1": 545.12,
"r_y1": 521.54,
"r_x2": 545.12,
"r_y2": 512.63,
"r_x3": 416.73,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.49,
"r_x1": 436.19,
"r_y1": 533.49,
"r_x2": 436.19,
"r_y2": 524.59,
"r_x3": 308.86,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.53,
"r_y0": 533.26,
"r_x1": 513.87,
"r_y1": 533.26,
"r_x2": 513.87,
"r_y2": 524.68,
"r_x3": 439.53,
"r_y3": 524.68,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.43,
"r_y0": 533.49,
"r_x1": 545.11,
"r_y1": 533.49,
"r_x2": 545.11,
"r_y2": 524.59,
"r_x3": 517.43,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.45,
"r_x1": 545.12,
"r_y1": 545.45,
"r_x2": 545.12,
"r_y2": 536.54,
"r_x3": 308.86,
"r_y3": 536.54,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.4,
"r_x1": 358.55,
"r_y1": 557.4,
"r_x2": 358.55,
"r_y2": 548.5,
"r_x3": 308.86,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.19,
"r_y0": 557.4,
"r_x1": 545.12,
"r_y1": 557.4,
"r_x2": 545.12,
"r_y2": 548.5,
"r_x3": 365.19,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.36,
"r_x1": 352.41,
"r_y1": 569.36,
"r_x2": 352.41,
"r_y2": 560.45,
"r_x3": 308.86,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.41,
"r_y0": 569.14,
"r_x1": 360.16,
"r_y1": 569.14,
"r_x2": 360.16,
"r_y2": 560.29,
"r_x3": 352.41,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.16,
"r_y0": 569.36,
"r_x1": 367.91,
"r_y1": 569.36,
"r_x2": 367.91,
"r_y2": 560.45,
"r_x3": 360.16,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.91,
"r_y0": 569.14,
"r_x1": 375.66,
"r_y1": 569.14,
"r_x2": 375.66,
"r_y2": 560.29,
"r_x3": 367.91,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.66,
"r_y0": 569.36,
"r_x1": 545.11,
"r_y1": 569.36,
"r_x2": 545.11,
"r_y2": 560.45,
"r_x3": 375.66,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.31,
"r_x1": 545.11,
"r_y1": 581.31,
"r_x2": 545.11,
"r_y2": 572.41,
"r_x3": 308.86,
"r_y3": 572.41,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.27,
"r_x1": 483.12,
"r_y1": 593.27,
"r_x2": 483.12,
"r_y2": 584.36,
"r_x3": 308.86,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 593.05,
"r_x1": 490.87,
"r_y1": 593.05,
"r_x2": 490.87,
"r_y2": 584.2,
"r_x3": 483.12,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.87,
"r_y0": 593.27,
"r_x1": 545.11,
"r_y1": 593.27,
"r_x2": 545.11,
"r_y2": 584.36,
"r_x3": 490.87,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.22,
"r_x1": 545.11,
"r_y1": 605.22,
"r_x2": 545.11,
"r_y2": 596.32,
"r_x3": 308.86,
"r_y3": 596.32,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.18,
"r_x1": 329.64,
"r_y1": 617.18,
"r_x2": 329.64,
"r_y2": 608.27,
"r_x3": 308.86,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.65,
"r_y0": 616.96,
"r_x1": 337.39,
"r_y1": 616.96,
"r_x2": 337.39,
"r_y2": 608.11,
"r_x3": 329.65,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.39,
"r_y0": 617.18,
"r_x1": 468.59,
"r_y1": 617.18,
"r_x2": 468.59,
"r_y2": 608.27,
"r_x3": 337.39,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.59,
"r_y0": 616.96,
"r_x1": 476.34,
"r_y1": 616.96,
"r_x2": 476.34,
"r_y2": 608.11,
"r_x3": 468.59,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.34,
"r_y0": 617.18,
"r_x1": 545.12,
"r_y1": 617.18,
"r_x2": 545.12,
"r_y2": 608.27,
"r_x3": 476.34,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.13,
"r_x1": 545.11,
"r_y1": 629.13,
"r_x2": 545.11,
"r_y2": 620.23,
"r_x3": 308.86,
"r_y3": 620.23,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.09,
"r_x1": 545.12,
"r_y1": 641.09,
"r_x2": 545.12,
"r_y2": 632.18,
"r_x3": 308.86,
"r_y3": 632.18,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.04,
"r_x1": 545.12,
"r_y1": 653.04,
"r_x2": 545.12,
"r_y2": 644.14,
"r_x3": 308.86,
"r_y3": 644.14,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.0,
"r_x1": 449.42,
"r_y1": 665.0,
"r_x2": 449.42,
"r_y2": 656.09,
"r_x3": 308.86,
"r_y3": 656.09,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.22,
"r_x1": 431.91,
"r_y1": 677.22,
"r_x2": 431.91,
"r_y2": 668.26,
"r_x3": 320.82,
"r_y3": 668.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 439.5,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.11,
"r_y1": 689.24,
"r_x2": 545.11,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 212.28,
"r_y1": 96.07,
"r_x2": 212.28,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 100.96,
"r": 286.37,
"b": 313.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 109.87,
"r_x1": 286.37,
"r_y1": 109.87,
"r_x2": 286.37,
"r_y2": 100.96,
"r_x3": 62.07,
"r_y3": 100.96,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 121.82,
"r_x1": 286.37,
"r_y1": 121.82,
"r_x2": 286.37,
"r_y2": 112.92,
"r_x3": 50.11,
"r_y3": 112.92,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 133.78,
"r_x1": 286.37,
"r_y1": 133.78,
"r_x2": 286.37,
"r_y2": 124.87,
"r_x3": 50.11,
"r_y3": 124.87,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 145.73,
"r_x1": 286.37,
"r_y1": 145.73,
"r_x2": 286.37,
"r_y2": 136.83,
"r_x3": 50.11,
"r_y3": 136.83,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 157.69,
"r_x1": 286.37,
"r_y1": 157.69,
"r_x2": 286.37,
"r_y2": 148.78,
"r_x3": 50.11,
"r_y3": 148.78,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 169.64,
"r_x1": 286.37,
"r_y1": 169.64,
"r_x2": 286.37,
"r_y2": 160.74,
"r_x3": 50.11,
"r_y3": 160.74,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 181.6,
"r_x1": 286.37,
"r_y1": 181.6,
"r_x2": 286.37,
"r_y2": 172.69,
"r_x3": 50.11,
"r_y3": 172.69,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 193.55,
"r_x1": 286.37,
"r_y1": 193.55,
"r_x2": 286.37,
"r_y2": 184.65,
"r_x3": 50.11,
"r_y3": 184.65,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 205.51,
"r_x1": 286.37,
"r_y1": 205.51,
"r_x2": 286.37,
"r_y2": 196.6,
"r_x3": 50.11,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 217.46,
"r_x1": 286.37,
"r_y1": 217.46,
"r_x2": 286.37,
"r_y2": 208.56,
"r_x3": 50.11,
"r_y3": 208.56,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 229.42,
"r_x1": 286.37,
"r_y1": 229.42,
"r_x2": 286.37,
"r_y2": 220.51,
"r_x3": 50.11,
"r_y3": 220.51,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 241.37,
"r_x1": 286.37,
"r_y1": 241.37,
"r_x2": 286.37,
"r_y2": 232.47,
"r_x3": 50.11,
"r_y3": 232.47,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 253.33,
"r_x1": 286.37,
"r_y1": 253.33,
"r_x2": 286.37,
"r_y2": 244.42,
"r_x3": 50.11,
"r_y3": 244.42,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 265.28,
"r_x1": 286.37,
"r_y1": 265.28,
"r_x2": 286.37,
"r_y2": 256.38,
"r_x3": 50.11,
"r_y3": 256.38,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 277.24,
"r_x1": 286.37,
"r_y1": 277.24,
"r_x2": 286.37,
"r_y2": 268.33,
"r_x3": 50.11,
"r_y3": 268.33,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 289.2,
"r_x1": 68.65,
"r_y1": 289.2,
"r_x2": 68.65,
"r_y2": 280.29,
"r_x3": 50.11,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.57,
"r_y0": 289.2,
"r_x1": 286.37,
"r_y1": 289.2,
"r_x2": 286.37,
"r_y2": 280.29,
"r_x3": 75.57,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 301.15,
"r_x1": 286.37,
"r_y1": 301.15,
"r_x2": 286.37,
"r_y2": 292.24,
"r_x3": 50.11,
"r_y3": 292.24,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 313.11,
"r_x1": 75.7,
"r_y1": 313.11,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.11,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 318.0,
"r": 286.37,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 326.9,
"r_x1": 286.36,
"r_y1": 326.9,
"r_x2": 286.36,
"r_y2": 318.0,
"r_x3": 62.07,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 338.86,
"r_x1": 286.37,
"r_y1": 338.86,
"r_x2": 286.37,
"r_y2": 329.95,
"r_x3": 50.11,
"r_y3": 329.95,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 350.81,
"r_x1": 286.37,
"r_y1": 350.81,
"r_x2": 286.37,
"r_y2": 341.91,
"r_x3": 50.11,
"r_y3": 341.91,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 362.77,
"r_x1": 286.37,
"r_y1": 362.77,
"r_x2": 286.37,
"r_y2": 353.86,
"r_x3": 50.11,
"r_y3": 353.86,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 374.72,
"r_x1": 286.37,
"r_y1": 374.72,
"r_x2": 286.37,
"r_y2": 365.82,
"r_x3": 50.11,
"r_y3": 365.82,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 386.68,
"r_x1": 141.59,
"r_y1": 386.68,
"r_x2": 141.59,
"r_y2": 377.77,
"r_x3": 50.11,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.68,
"r_x1": 286.37,
"r_y1": 386.68,
"r_x2": 286.37,
"r_y2": 377.77,
"r_x3": 148.7,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 398.63,
"r_x1": 286.37,
"r_y1": 398.63,
"r_x2": 286.37,
"r_y2": 389.73,
"r_x3": 50.11,
"r_y3": 389.73,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 410.59,
"r_x1": 286.37,
"r_y1": 410.59,
"r_x2": 286.37,
"r_y2": 401.68,
"r_x3": 50.11,
"r_y3": 401.68,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 422.54,
"r_x1": 286.37,
"r_y1": 422.54,
"r_x2": 286.37,
"r_y2": 413.64,
"r_x3": 50.11,
"r_y3": 413.64,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.59,
"r_x3": 50.11,
"r_y3": 425.59,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 439.39,
"r": 286.37,
"b": 627.62,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 448.3,
"r_x1": 286.36,
"r_y1": 448.3,
"r_x2": 286.36,
"r_y2": 439.39,
"r_x3": 62.07,
"r_y3": 439.39,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.25,
"r_x1": 172.14,
"r_y1": 460.25,
"r_x2": 172.14,
"r_y2": 451.34,
"r_x3": 50.11,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.15,
"r_y0": 460.02,
"r_x1": 224.71,
"r_y1": 460.02,
"r_x2": 224.71,
"r_y2": 451.43,
"r_x3": 174.15,
"r_y3": 451.43,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.71,
"r_y0": 460.25,
"r_x1": 286.37,
"r_y1": 460.25,
"r_x2": 286.37,
"r_y2": 451.34,
"r_x3": 224.71,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.21,
"r_x1": 286.37,
"r_y1": 472.21,
"r_x2": 286.37,
"r_y2": 463.3,
"r_x3": 50.11,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.16,
"r_x1": 286.37,
"r_y1": 484.16,
"r_x2": 286.37,
"r_y2": 475.26,
"r_x3": 50.11,
"r_y3": 475.26,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 496.12,
"r_x1": 286.37,
"r_y1": 496.12,
"r_x2": 286.37,
"r_y2": 487.21,
"r_x3": 50.11,
"r_y3": 487.21,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 508.07,
"r_x1": 286.37,
"r_y1": 508.07,
"r_x2": 286.37,
"r_y2": 499.17,
"r_x3": 50.11,
"r_y3": 499.17,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 520.03,
"r_x1": 286.37,
"r_y1": 520.03,
"r_x2": 286.37,
"r_y2": 511.12,
"r_x3": 50.11,
"r_y3": 511.12,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.98,
"r_x1": 286.37,
"r_y1": 531.98,
"r_x2": 286.37,
"r_y2": 523.08,
"r_x3": 50.11,
"r_y3": 523.08,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.94,
"r_x1": 286.37,
"r_y1": 543.94,
"r_x2": 286.37,
"r_y2": 535.03,
"r_x3": 50.11,
"r_y3": 535.03,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.89,
"r_x1": 286.37,
"r_y1": 555.89,
"r_x2": 286.37,
"r_y2": 546.99,
"r_x3": 50.11,
"r_y3": 546.99,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.85,
"r_x1": 286.37,
"r_y1": 567.85,
"r_x2": 286.37,
"r_y2": 558.94,
"r_x3": 50.11,
"r_y3": 558.94,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.8,
"r_x1": 286.37,
"r_y1": 579.8,
"r_x2": 286.37,
"r_y2": 570.9,
"r_x3": 50.11,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.76,
"r_x1": 286.37,
"r_y1": 591.76,
"r_x2": 286.37,
"r_y2": 582.85,
"r_x3": 50.11,
"r_y3": 582.85,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.71,
"r_x1": 286.37,
"r_y1": 603.71,
"r_x2": 286.37,
"r_y2": 594.81,
"r_x3": 50.11,
"r_y3": 594.81,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.67,
"r_x1": 286.37,
"r_y1": 615.67,
"r_x2": 286.37,
"r_y2": 606.76,
"r_x3": 50.11,
"r_y3": 606.76,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.62,
"r_x1": 209.75,
"r_y1": 627.62,
"r_x2": 209.75,
"r_y2": 618.72,
"r_x3": 50.11,
"r_y3": 618.72,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 632.51,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 641.42,
"r_x1": 286.36,
"r_y1": 641.42,
"r_x2": 286.36,
"r_y2": 632.51,
"r_x3": 62.07,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.43,
"r_x3": 50.11,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 310.68,
"t": 73.19,
"r": 542.95,
"b": 155.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 9,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 167.66,
"r": 545.12,
"b": 224.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 176.57,
"r_x1": 344.62,
"r_y1": 176.57,
"r_x2": 344.62,
"r_y2": 167.66,
"r_x3": 308.86,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.08,
"r_y0": 176.57,
"r_x1": 380.45,
"r_y1": 176.57,
"r_x2": 380.45,
"r_y2": 167.66,
"r_x3": 361.08,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.57,
"r_y0": 176.34,
"r_x1": 468.68,
"r_y1": 176.34,
"r_x2": 468.68,
"r_y2": 167.75,
"r_x3": 386.57,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.57,
"r_x1": 489.18,
"r_y1": 176.57,
"r_x2": 489.18,
"r_y2": 167.66,
"r_x3": 474.8,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.34,
"r_x1": 545.11,
"r_y1": 176.34,
"r_x2": 545.11,
"r_y2": 167.75,
"r_x3": 495.3,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 188.29,
"r_x1": 341.16,
"r_y1": 188.29,
"r_x2": 341.16,
"r_y2": 179.71,
"r_x3": 308.86,
"r_y3": 179.71,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.46,
"r_y0": 188.52,
"r_x1": 545.11,
"r_y1": 188.52,
"r_x2": 545.11,
"r_y2": 179.62,
"r_x3": 343.46,
"r_y3": 179.62,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 200.48,
"r_x1": 545.12,
"r_y1": 200.48,
"r_x2": 545.12,
"r_y2": 191.57,
"r_x3": 308.86,
"r_y3": 191.57,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 212.43,
"r_x1": 545.11,
"r_y1": 212.43,
"r_x2": 545.11,
"r_y2": 203.53,
"r_x3": 308.86,
"r_y3": 203.53,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 224.39,
"r_x1": 523.93,
"r_y1": 224.39,
"r_x2": 523.93,
"r_y2": 215.48,
"r_x3": 308.86,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 308.86,
"t": 249.62,
"r": 545.12,
"b": 294.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.53,
"r_x1": 545.12,
"r_y1": 258.53,
"r_x2": 545.12,
"r_y2": 249.62,
"r_x3": 308.86,
"r_y3": 249.62,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.48,
"r_x1": 545.12,
"r_y1": 270.48,
"r_x2": 545.12,
"r_y2": 261.58,
"r_x3": 308.86,
"r_y3": 261.58,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.44,
"r_x1": 545.12,
"r_y1": 282.44,
"r_x2": 545.12,
"r_y2": 273.53,
"r_x3": 308.86,
"r_y3": 273.53,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.39,
"r_x1": 436.82,
"r_y1": 294.39,
"r_x2": 436.82,
"r_y2": 285.49,
"r_x3": 308.86,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "text",
"bbox": {
"l": 320.82,
"t": 297.77,
"r": 542.74,
"b": 306.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 306.68,
"r_x1": 542.74,
"r_y1": 306.68,
"r_x2": 542.74,
"r_y2": 297.77,
"r_x3": 320.82,
"r_y3": 297.77,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 321.18,
"r": 444.94,
"b": 331.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.947,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 331.93,
"r_x1": 316.28,
"r_y1": 331.93,
"r_x2": 316.28,
"r_y2": 321.18,
"r_x3": 308.86,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.18,
"r_y0": 331.93,
"r_x1": 444.94,
"r_y1": 331.93,
"r_x2": 444.94,
"r_y2": 321.18,
"r_x3": 326.18,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 341.94,
"r": 545.12,
"b": 446.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 350.85,
"r_x1": 545.11,
"r_y1": 350.85,
"r_x2": 545.11,
"r_y2": 341.94,
"r_x3": 320.82,
"r_y3": 341.94,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 362.8,
"r_x1": 545.12,
"r_y1": 362.8,
"r_x2": 545.12,
"r_y2": 353.89,
"r_x3": 308.86,
"r_y3": 353.89,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 374.76,
"r_x1": 545.12,
"r_y1": 374.76,
"r_x2": 545.12,
"r_y2": 365.85,
"r_x3": 308.86,
"r_y3": 365.85,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 386.71,
"r_x1": 545.12,
"r_y1": 386.71,
"r_x2": 545.12,
"r_y2": 377.8,
"r_x3": 308.86,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 398.67,
"r_x1": 545.12,
"r_y1": 398.67,
"r_x2": 545.12,
"r_y2": 389.76,
"r_x3": 308.86,
"r_y3": 389.76,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 410.62,
"r_x1": 545.12,
"r_y1": 410.62,
"r_x2": 545.12,
"r_y2": 401.71,
"r_x3": 308.86,
"r_y3": 401.71,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 422.58,
"r_x1": 545.12,
"r_y1": 422.58,
"r_x2": 545.12,
"r_y2": 413.67,
"r_x3": 308.86,
"r_y3": 413.67,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 434.53,
"r_x1": 545.12,
"r_y1": 434.53,
"r_x2": 545.12,
"r_y2": 425.63,
"r_x3": 308.86,
"r_y3": 425.63,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 446.49,
"r_x1": 437.94,
"r_y1": 446.49,
"r_x2": 437.94,
"r_y2": 437.58,
"r_x3": 308.86,
"r_y3": 437.58,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 457.69,
"r": 420.16,
"b": 467.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 467.55,
"r_x1": 323.14,
"r_y1": 467.55,
"r_x2": 323.14,
"r_y2": 457.69,
"r_x3": 308.86,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.66,
"r_y0": 467.55,
"r_x1": 420.16,
"r_y1": 467.55,
"r_x2": 420.16,
"r_y2": 457.69,
"r_x3": 332.66,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 476.77,
"r": 545.12,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 485.67,
"r_x1": 545.11,
"r_y1": 485.67,
"r_x2": 545.11,
"r_y2": 476.77,
"r_x3": 320.82,
"r_y3": 476.77,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.63,
"r_x1": 509.02,
"r_y1": 497.63,
"r_x2": 509.02,
"r_y2": 488.72,
"r_x3": 308.86,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.59,
"r_y0": 497.63,
"r_x1": 523.06,
"r_y1": 497.63,
"r_x2": 523.06,
"r_y2": 488.72,
"r_x3": 515.59,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 497.63,
"r_x1": 545.12,
"r_y1": 497.63,
"r_x2": 545.12,
"r_y2": 488.72,
"r_x3": 529.62,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.35,
"r_x1": 406.35,
"r_y1": 509.35,
"r_x2": 406.35,
"r_y2": 500.76,
"r_x3": 308.86,
"r_y3": 500.76,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.87,
"r_y0": 509.58,
"r_x1": 545.11,
"r_y1": 509.58,
"r_x2": 545.11,
"r_y2": 500.68,
"r_x3": 408.87,
"r_y3": 500.68,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.54,
"r_x1": 409.39,
"r_y1": 521.54,
"r_x2": 409.39,
"r_y2": 512.63,
"r_x3": 308.86,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.73,
"r_y0": 521.54,
"r_x1": 545.12,
"r_y1": 521.54,
"r_x2": 545.12,
"r_y2": 512.63,
"r_x3": 416.73,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.49,
"r_x1": 436.19,
"r_y1": 533.49,
"r_x2": 436.19,
"r_y2": 524.59,
"r_x3": 308.86,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.53,
"r_y0": 533.26,
"r_x1": 513.87,
"r_y1": 533.26,
"r_x2": 513.87,
"r_y2": 524.68,
"r_x3": 439.53,
"r_y3": 524.68,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.43,
"r_y0": 533.49,
"r_x1": 545.11,
"r_y1": 533.49,
"r_x2": 545.11,
"r_y2": 524.59,
"r_x3": 517.43,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.45,
"r_x1": 545.12,
"r_y1": 545.45,
"r_x2": 545.12,
"r_y2": 536.54,
"r_x3": 308.86,
"r_y3": 536.54,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.4,
"r_x1": 358.55,
"r_y1": 557.4,
"r_x2": 358.55,
"r_y2": 548.5,
"r_x3": 308.86,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.19,
"r_y0": 557.4,
"r_x1": 545.12,
"r_y1": 557.4,
"r_x2": 545.12,
"r_y2": 548.5,
"r_x3": 365.19,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.36,
"r_x1": 352.41,
"r_y1": 569.36,
"r_x2": 352.41,
"r_y2": 560.45,
"r_x3": 308.86,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.41,
"r_y0": 569.14,
"r_x1": 360.16,
"r_y1": 569.14,
"r_x2": 360.16,
"r_y2": 560.29,
"r_x3": 352.41,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.16,
"r_y0": 569.36,
"r_x1": 367.91,
"r_y1": 569.36,
"r_x2": 367.91,
"r_y2": 560.45,
"r_x3": 360.16,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.91,
"r_y0": 569.14,
"r_x1": 375.66,
"r_y1": 569.14,
"r_x2": 375.66,
"r_y2": 560.29,
"r_x3": 367.91,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.66,
"r_y0": 569.36,
"r_x1": 545.11,
"r_y1": 569.36,
"r_x2": 545.11,
"r_y2": 560.45,
"r_x3": 375.66,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.31,
"r_x1": 545.11,
"r_y1": 581.31,
"r_x2": 545.11,
"r_y2": 572.41,
"r_x3": 308.86,
"r_y3": 572.41,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.27,
"r_x1": 483.12,
"r_y1": 593.27,
"r_x2": 483.12,
"r_y2": 584.36,
"r_x3": 308.86,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 593.05,
"r_x1": 490.87,
"r_y1": 593.05,
"r_x2": 490.87,
"r_y2": 584.2,
"r_x3": 483.12,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.87,
"r_y0": 593.27,
"r_x1": 545.11,
"r_y1": 593.27,
"r_x2": 545.11,
"r_y2": 584.36,
"r_x3": 490.87,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.22,
"r_x1": 545.11,
"r_y1": 605.22,
"r_x2": 545.11,
"r_y2": 596.32,
"r_x3": 308.86,
"r_y3": 596.32,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.18,
"r_x1": 329.64,
"r_y1": 617.18,
"r_x2": 329.64,
"r_y2": 608.27,
"r_x3": 308.86,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.65,
"r_y0": 616.96,
"r_x1": 337.39,
"r_y1": 616.96,
"r_x2": 337.39,
"r_y2": 608.11,
"r_x3": 329.65,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.39,
"r_y0": 617.18,
"r_x1": 468.59,
"r_y1": 617.18,
"r_x2": 468.59,
"r_y2": 608.27,
"r_x3": 337.39,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.59,
"r_y0": 616.96,
"r_x1": 476.34,
"r_y1": 616.96,
"r_x2": 476.34,
"r_y2": 608.11,
"r_x3": 468.59,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.34,
"r_y0": 617.18,
"r_x1": 545.12,
"r_y1": 617.18,
"r_x2": 545.12,
"r_y2": 608.27,
"r_x3": 476.34,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.13,
"r_x1": 545.11,
"r_y1": 629.13,
"r_x2": 545.11,
"r_y2": 620.23,
"r_x3": 308.86,
"r_y3": 620.23,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.09,
"r_x1": 545.12,
"r_y1": 641.09,
"r_x2": 545.12,
"r_y2": 632.18,
"r_x3": 308.86,
"r_y3": 632.18,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.04,
"r_x1": 545.12,
"r_y1": 653.04,
"r_x2": 545.12,
"r_y2": 644.14,
"r_x3": 308.86,
"r_y3": 644.14,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.0,
"r_x1": 449.42,
"r_y1": 665.0,
"r_x2": 449.42,
"r_y2": 656.09,
"r_x3": 308.86,
"r_y3": 656.09,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.26,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.22,
"r_x1": 431.91,
"r_y1": 677.22,
"r_x2": 431.91,
"r_y2": 668.26,
"r_x3": 320.82,
"r_y3": 668.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 439.5,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.11,
"r_y1": 689.24,
"r_x2": 545.11,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"8": {
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.68,
"t": 73.19,
"r": 542.95,
"b": 155.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 10,
"page_no": 3,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 212.28,
"r_y1": 96.07,
"r_x2": 212.28,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."
},
{
"label": "text",
"id": 1,
"page_no": 3,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 100.96,
"r": 286.37,
"b": 313.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 109.87,
"r_x1": 286.37,
"r_y1": 109.87,
"r_x2": 286.37,
"r_y2": 100.96,
"r_x3": 62.07,
"r_y3": 100.96,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 121.82,
"r_x1": 286.37,
"r_y1": 121.82,
"r_x2": 286.37,
"r_y2": 112.92,
"r_x3": 50.11,
"r_y3": 112.92,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 133.78,
"r_x1": 286.37,
"r_y1": 133.78,
"r_x2": 286.37,
"r_y2": 124.87,
"r_x3": 50.11,
"r_y3": 124.87,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 145.73,
"r_x1": 286.37,
"r_y1": 145.73,
"r_x2": 286.37,
"r_y2": 136.83,
"r_x3": 50.11,
"r_y3": 136.83,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 157.69,
"r_x1": 286.37,
"r_y1": 157.69,
"r_x2": 286.37,
"r_y2": 148.78,
"r_x3": 50.11,
"r_y3": 148.78,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 169.64,
"r_x1": 286.37,
"r_y1": 169.64,
"r_x2": 286.37,
"r_y2": 160.74,
"r_x3": 50.11,
"r_y3": 160.74,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 181.6,
"r_x1": 286.37,
"r_y1": 181.6,
"r_x2": 286.37,
"r_y2": 172.69,
"r_x3": 50.11,
"r_y3": 172.69,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 193.55,
"r_x1": 286.37,
"r_y1": 193.55,
"r_x2": 286.37,
"r_y2": 184.65,
"r_x3": 50.11,
"r_y3": 184.65,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 205.51,
"r_x1": 286.37,
"r_y1": 205.51,
"r_x2": 286.37,
"r_y2": 196.6,
"r_x3": 50.11,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 217.46,
"r_x1": 286.37,
"r_y1": 217.46,
"r_x2": 286.37,
"r_y2": 208.56,
"r_x3": 50.11,
"r_y3": 208.56,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 229.42,
"r_x1": 286.37,
"r_y1": 229.42,
"r_x2": 286.37,
"r_y2": 220.51,
"r_x3": 50.11,
"r_y3": 220.51,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 241.37,
"r_x1": 286.37,
"r_y1": 241.37,
"r_x2": 286.37,
"r_y2": 232.47,
"r_x3": 50.11,
"r_y3": 232.47,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 253.33,
"r_x1": 286.37,
"r_y1": 253.33,
"r_x2": 286.37,
"r_y2": 244.42,
"r_x3": 50.11,
"r_y3": 244.42,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 265.28,
"r_x1": 286.37,
"r_y1": 265.28,
"r_x2": 286.37,
"r_y2": 256.38,
"r_x3": 50.11,
"r_y3": 256.38,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 277.24,
"r_x1": 286.37,
"r_y1": 277.24,
"r_x2": 286.37,
"r_y2": 268.33,
"r_x3": 50.11,
"r_y3": 268.33,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 289.2,
"r_x1": 68.65,
"r_y1": 289.2,
"r_x2": 68.65,
"r_y2": 280.29,
"r_x3": 50.11,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.57,
"r_y0": 289.2,
"r_x1": 286.37,
"r_y1": 289.2,
"r_x2": 286.37,
"r_y2": 280.29,
"r_x3": 75.57,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 301.15,
"r_x1": 286.37,
"r_y1": 301.15,
"r_x2": 286.37,
"r_y2": 292.24,
"r_x3": 50.11,
"r_y3": 292.24,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 313.11,
"r_x1": 75.7,
"r_y1": 313.11,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.11,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 3,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 318.0,
"r": 286.37,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 326.9,
"r_x1": 286.36,
"r_y1": 326.9,
"r_x2": 286.36,
"r_y2": 318.0,
"r_x3": 62.07,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 338.86,
"r_x1": 286.37,
"r_y1": 338.86,
"r_x2": 286.37,
"r_y2": 329.95,
"r_x3": 50.11,
"r_y3": 329.95,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 350.81,
"r_x1": 286.37,
"r_y1": 350.81,
"r_x2": 286.37,
"r_y2": 341.91,
"r_x3": 50.11,
"r_y3": 341.91,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 362.77,
"r_x1": 286.37,
"r_y1": 362.77,
"r_x2": 286.37,
"r_y2": 353.86,
"r_x3": 50.11,
"r_y3": 353.86,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 374.72,
"r_x1": 286.37,
"r_y1": 374.72,
"r_x2": 286.37,
"r_y2": 365.82,
"r_x3": 50.11,
"r_y3": 365.82,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 386.68,
"r_x1": 141.59,
"r_y1": 386.68,
"r_x2": 141.59,
"r_y2": 377.77,
"r_x3": 50.11,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.68,
"r_x1": 286.37,
"r_y1": 386.68,
"r_x2": 286.37,
"r_y2": 377.77,
"r_x3": 148.7,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 398.63,
"r_x1": 286.37,
"r_y1": 398.63,
"r_x2": 286.37,
"r_y2": 389.73,
"r_x3": 50.11,
"r_y3": 389.73,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 410.59,
"r_x1": 286.37,
"r_y1": 410.59,
"r_x2": 286.37,
"r_y2": 401.68,
"r_x3": 50.11,
"r_y3": 401.68,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 422.54,
"r_x1": 286.37,
"r_y1": 422.54,
"r_x2": 286.37,
"r_y2": 413.64,
"r_x3": 50.11,
"r_y3": 413.64,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.59,
"r_x3": 50.11,
"r_y3": 425.59,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."
},
{
"label": "text",
"id": 3,
"page_no": 3,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 439.39,
"r": 286.37,
"b": 627.62,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 448.3,
"r_x1": 286.36,
"r_y1": 448.3,
"r_x2": 286.36,
"r_y2": 439.39,
"r_x3": 62.07,
"r_y3": 439.39,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.25,
"r_x1": 172.14,
"r_y1": 460.25,
"r_x2": 172.14,
"r_y2": 451.34,
"r_x3": 50.11,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.15,
"r_y0": 460.02,
"r_x1": 224.71,
"r_y1": 460.02,
"r_x2": 224.71,
"r_y2": 451.43,
"r_x3": 174.15,
"r_y3": 451.43,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.71,
"r_y0": 460.25,
"r_x1": 286.37,
"r_y1": 460.25,
"r_x2": 286.37,
"r_y2": 451.34,
"r_x3": 224.71,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.21,
"r_x1": 286.37,
"r_y1": 472.21,
"r_x2": 286.37,
"r_y2": 463.3,
"r_x3": 50.11,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.16,
"r_x1": 286.37,
"r_y1": 484.16,
"r_x2": 286.37,
"r_y2": 475.26,
"r_x3": 50.11,
"r_y3": 475.26,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 496.12,
"r_x1": 286.37,
"r_y1": 496.12,
"r_x2": 286.37,
"r_y2": 487.21,
"r_x3": 50.11,
"r_y3": 487.21,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 508.07,
"r_x1": 286.37,
"r_y1": 508.07,
"r_x2": 286.37,
"r_y2": 499.17,
"r_x3": 50.11,
"r_y3": 499.17,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 520.03,
"r_x1": 286.37,
"r_y1": 520.03,
"r_x2": 286.37,
"r_y2": 511.12,
"r_x3": 50.11,
"r_y3": 511.12,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.98,
"r_x1": 286.37,
"r_y1": 531.98,
"r_x2": 286.37,
"r_y2": 523.08,
"r_x3": 50.11,
"r_y3": 523.08,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.94,
"r_x1": 286.37,
"r_y1": 543.94,
"r_x2": 286.37,
"r_y2": 535.03,
"r_x3": 50.11,
"r_y3": 535.03,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.89,
"r_x1": 286.37,
"r_y1": 555.89,
"r_x2": 286.37,
"r_y2": 546.99,
"r_x3": 50.11,
"r_y3": 546.99,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.85,
"r_x1": 286.37,
"r_y1": 567.85,
"r_x2": 286.37,
"r_y2": 558.94,
"r_x3": 50.11,
"r_y3": 558.94,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.8,
"r_x1": 286.37,
"r_y1": 579.8,
"r_x2": 286.37,
"r_y2": 570.9,
"r_x3": 50.11,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.76,
"r_x1": 286.37,
"r_y1": 591.76,
"r_x2": 286.37,
"r_y2": 582.85,
"r_x3": 50.11,
"r_y3": 582.85,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.71,
"r_x1": 286.37,
"r_y1": 603.71,
"r_x2": 286.37,
"r_y2": 594.81,
"r_x3": 50.11,
"r_y3": 594.81,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.67,
"r_x1": 286.37,
"r_y1": 615.67,
"r_x2": 286.37,
"r_y2": 606.76,
"r_x3": 50.11,
"r_y3": 606.76,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.62,
"r_x1": 209.75,
"r_y1": 627.62,
"r_x2": 209.75,
"r_y2": 618.72,
"r_x3": 50.11,
"r_y3": 618.72,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."
},
{
"label": "text",
"id": 5,
"page_no": 3,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 632.51,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 641.42,
"r_x1": 286.36,
"r_y1": 641.42,
"r_x2": 286.36,
"r_y2": 632.51,
"r_x3": 62.07,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.43,
"r_x3": 50.11,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"
},
{
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.68,
"t": 73.19,
"r": 542.95,
"b": 155.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 9,
"page_no": 3,
"cluster": {
"id": 9,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 167.66,
"r": 545.12,
"b": 224.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 176.57,
"r_x1": 344.62,
"r_y1": 176.57,
"r_x2": 344.62,
"r_y2": 167.66,
"r_x3": 308.86,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.08,
"r_y0": 176.57,
"r_x1": 380.45,
"r_y1": 176.57,
"r_x2": 380.45,
"r_y2": 167.66,
"r_x3": 361.08,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.57,
"r_y0": 176.34,
"r_x1": 468.68,
"r_y1": 176.34,
"r_x2": 468.68,
"r_y2": 167.75,
"r_x3": 386.57,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.57,
"r_x1": 489.18,
"r_y1": 176.57,
"r_x2": 489.18,
"r_y2": 167.66,
"r_x3": 474.8,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.34,
"r_x1": 545.11,
"r_y1": 176.34,
"r_x2": 545.11,
"r_y2": 167.75,
"r_x3": 495.3,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 188.29,
"r_x1": 341.16,
"r_y1": 188.29,
"r_x2": 341.16,
"r_y2": 179.71,
"r_x3": 308.86,
"r_y3": 179.71,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.46,
"r_y0": 188.52,
"r_x1": 545.11,
"r_y1": 188.52,
"r_x2": 545.11,
"r_y2": 179.62,
"r_x3": 343.46,
"r_y3": 179.62,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 200.48,
"r_x1": 545.12,
"r_y1": 200.48,
"r_x2": 545.12,
"r_y2": 191.57,
"r_x3": 308.86,
"r_y3": 191.57,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 212.43,
"r_x1": 545.11,
"r_y1": 212.43,
"r_x2": 545.11,
"r_y2": 203.53,
"r_x3": 308.86,
"r_y3": 203.53,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 224.39,
"r_x1": 523.93,
"r_y1": 224.39,
"r_x2": 523.93,
"r_y2": 215.48,
"r_x3": 308.86,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."
},
{
"label": "text",
"id": 6,
"page_no": 3,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 308.86,
"t": 249.62,
"r": 545.12,
"b": 294.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.53,
"r_x1": 545.12,
"r_y1": 258.53,
"r_x2": 545.12,
"r_y2": 249.62,
"r_x3": 308.86,
"r_y3": 249.62,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.48,
"r_x1": 545.12,
"r_y1": 270.48,
"r_x2": 545.12,
"r_y2": 261.58,
"r_x3": 308.86,
"r_y3": 261.58,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.44,
"r_x1": 545.12,
"r_y1": 282.44,
"r_x2": 545.12,
"r_y2": 273.53,
"r_x3": 308.86,
"r_y3": 273.53,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.39,
"r_x1": 436.82,
"r_y1": 294.39,
"r_x2": 436.82,
"r_y2": 285.49,
"r_x3": 308.86,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."
},
{
"label": "text",
"id": 13,
"page_no": 3,
"cluster": {
"id": 13,
"label": "text",
"bbox": {
"l": 320.82,
"t": 297.77,
"r": 542.74,
"b": 306.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 306.68,
"r_x1": 542.74,
"r_y1": 306.68,
"r_x2": 542.74,
"r_y2": 297.77,
"r_x3": 320.82,
"r_y3": 297.77,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tab. 1 summarizes the various attributes of the datasets."
},
{
"label": "section_header",
"id": 11,
"page_no": 3,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 321.18,
"r": 444.94,
"b": 331.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.947,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 331.93,
"r_x1": 316.28,
"r_y1": 331.93,
"r_x2": 316.28,
"r_y2": 321.18,
"r_x3": 308.86,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.18,
"r_y0": 331.93,
"r_x1": 444.94,
"r_y1": 331.93,
"r_x2": 444.94,
"r_y2": 321.18,
"r_x3": 326.18,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. The TableFormer model"
},
{
"label": "text",
"id": 0,
"page_no": 3,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 341.94,
"r": 545.12,
"b": 446.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 350.85,
"r_x1": 545.11,
"r_y1": 350.85,
"r_x2": 545.11,
"r_y2": 341.94,
"r_x3": 320.82,
"r_y3": 341.94,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 362.8,
"r_x1": 545.12,
"r_y1": 362.8,
"r_x2": 545.12,
"r_y2": 353.89,
"r_x3": 308.86,
"r_y3": 353.89,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 374.76,
"r_x1": 545.12,
"r_y1": 374.76,
"r_x2": 545.12,
"r_y2": 365.85,
"r_x3": 308.86,
"r_y3": 365.85,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 386.71,
"r_x1": 545.12,
"r_y1": 386.71,
"r_x2": 545.12,
"r_y2": 377.8,
"r_x3": 308.86,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 398.67,
"r_x1": 545.12,
"r_y1": 398.67,
"r_x2": 545.12,
"r_y2": 389.76,
"r_x3": 308.86,
"r_y3": 389.76,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 410.62,
"r_x1": 545.12,
"r_y1": 410.62,
"r_x2": 545.12,
"r_y2": 401.71,
"r_x3": 308.86,
"r_y3": 401.71,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 422.58,
"r_x1": 545.12,
"r_y1": 422.58,
"r_x2": 545.12,
"r_y2": 413.67,
"r_x3": 308.86,
"r_y3": 413.67,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 434.53,
"r_x1": 545.12,
"r_y1": 434.53,
"r_x2": 545.12,
"r_y2": 425.63,
"r_x3": 308.86,
"r_y3": 425.63,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 446.49,
"r_x1": 437.94,
"r_y1": 446.49,
"r_x2": 437.94,
"r_y2": 437.58,
"r_x3": 308.86,
"r_y3": 437.58,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."
},
{
"label": "section_header",
"id": 12,
"page_no": 3,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 457.69,
"r": 420.16,
"b": 467.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 467.55,
"r_x1": 323.14,
"r_y1": 467.55,
"r_x2": 323.14,
"r_y2": 457.69,
"r_x3": 308.86,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.66,
"r_y0": 467.55,
"r_x1": 420.16,
"r_y1": 467.55,
"r_x2": 420.16,
"r_y2": 457.69,
"r_x3": 332.66,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4.1. Model architecture."
},
{
"label": "text",
"id": 2,
"page_no": 3,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 476.77,
"r": 545.12,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 485.67,
"r_x1": 545.11,
"r_y1": 485.67,
"r_x2": 545.11,
"r_y2": 476.77,
"r_x3": 320.82,
"r_y3": 476.77,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.63,
"r_x1": 509.02,
"r_y1": 497.63,
"r_x2": 509.02,
"r_y2": 488.72,
"r_x3": 308.86,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.59,
"r_y0": 497.63,
"r_x1": 523.06,
"r_y1": 497.63,
"r_x2": 523.06,
"r_y2": 488.72,
"r_x3": 515.59,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 497.63,
"r_x1": 545.12,
"r_y1": 497.63,
"r_x2": 545.12,
"r_y2": 488.72,
"r_x3": 529.62,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.35,
"r_x1": 406.35,
"r_y1": 509.35,
"r_x2": 406.35,
"r_y2": 500.76,
"r_x3": 308.86,
"r_y3": 500.76,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.87,
"r_y0": 509.58,
"r_x1": 545.11,
"r_y1": 509.58,
"r_x2": 545.11,
"r_y2": 500.68,
"r_x3": 408.87,
"r_y3": 500.68,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.54,
"r_x1": 409.39,
"r_y1": 521.54,
"r_x2": 409.39,
"r_y2": 512.63,
"r_x3": 308.86,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.73,
"r_y0": 521.54,
"r_x1": 545.12,
"r_y1": 521.54,
"r_x2": 545.12,
"r_y2": 512.63,
"r_x3": 416.73,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.49,
"r_x1": 436.19,
"r_y1": 533.49,
"r_x2": 436.19,
"r_y2": 524.59,
"r_x3": 308.86,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.53,
"r_y0": 533.26,
"r_x1": 513.87,
"r_y1": 533.26,
"r_x2": 513.87,
"r_y2": 524.68,
"r_x3": 439.53,
"r_y3": 524.68,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.43,
"r_y0": 533.49,
"r_x1": 545.11,
"r_y1": 533.49,
"r_x2": 545.11,
"r_y2": 524.59,
"r_x3": 517.43,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.45,
"r_x1": 545.12,
"r_y1": 545.45,
"r_x2": 545.12,
"r_y2": 536.54,
"r_x3": 308.86,
"r_y3": 536.54,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.4,
"r_x1": 358.55,
"r_y1": 557.4,
"r_x2": 358.55,
"r_y2": 548.5,
"r_x3": 308.86,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.19,
"r_y0": 557.4,
"r_x1": 545.12,
"r_y1": 557.4,
"r_x2": 545.12,
"r_y2": 548.5,
"r_x3": 365.19,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.36,
"r_x1": 352.41,
"r_y1": 569.36,
"r_x2": 352.41,
"r_y2": 560.45,
"r_x3": 308.86,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.41,
"r_y0": 569.14,
"r_x1": 360.16,
"r_y1": 569.14,
"r_x2": 360.16,
"r_y2": 560.29,
"r_x3": 352.41,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.16,
"r_y0": 569.36,
"r_x1": 367.91,
"r_y1": 569.36,
"r_x2": 367.91,
"r_y2": 560.45,
"r_x3": 360.16,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.91,
"r_y0": 569.14,
"r_x1": 375.66,
"r_y1": 569.14,
"r_x2": 375.66,
"r_y2": 560.29,
"r_x3": 367.91,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.66,
"r_y0": 569.36,
"r_x1": 545.11,
"r_y1": 569.36,
"r_x2": 545.11,
"r_y2": 560.45,
"r_x3": 375.66,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.31,
"r_x1": 545.11,
"r_y1": 581.31,
"r_x2": 545.11,
"r_y2": 572.41,
"r_x3": 308.86,
"r_y3": 572.41,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.27,
"r_x1": 483.12,
"r_y1": 593.27,
"r_x2": 483.12,
"r_y2": 584.36,
"r_x3": 308.86,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 593.05,
"r_x1": 490.87,
"r_y1": 593.05,
"r_x2": 490.87,
"r_y2": 584.2,
"r_x3": 483.12,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.87,
"r_y0": 593.27,
"r_x1": 545.11,
"r_y1": 593.27,
"r_x2": 545.11,
"r_y2": 584.36,
"r_x3": 490.87,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.22,
"r_x1": 545.11,
"r_y1": 605.22,
"r_x2": 545.11,
"r_y2": 596.32,
"r_x3": 308.86,
"r_y3": 596.32,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.18,
"r_x1": 329.64,
"r_y1": 617.18,
"r_x2": 329.64,
"r_y2": 608.27,
"r_x3": 308.86,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.65,
"r_y0": 616.96,
"r_x1": 337.39,
"r_y1": 616.96,
"r_x2": 337.39,
"r_y2": 608.11,
"r_x3": 329.65,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.39,
"r_y0": 617.18,
"r_x1": 468.59,
"r_y1": 617.18,
"r_x2": 468.59,
"r_y2": 608.27,
"r_x3": 337.39,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.59,
"r_y0": 616.96,
"r_x1": 476.34,
"r_y1": 616.96,
"r_x2": 476.34,
"r_y2": 608.11,
"r_x3": 468.59,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.34,
"r_y0": 617.18,
"r_x1": 545.12,
"r_y1": 617.18,
"r_x2": 545.12,
"r_y2": 608.27,
"r_x3": 476.34,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.13,
"r_x1": 545.11,
"r_y1": 629.13,
"r_x2": 545.11,
"r_y2": 620.23,
"r_x3": 308.86,
"r_y3": 620.23,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.09,
"r_x1": 545.12,
"r_y1": 641.09,
"r_x2": 545.12,
"r_y2": 632.18,
"r_x3": 308.86,
"r_y3": 632.18,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.04,
"r_x1": 545.12,
"r_y1": 653.04,
"r_x2": 545.12,
"r_y2": 644.14,
"r_x3": 308.86,
"r_y3": 644.14,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.0,
"r_x1": 449.42,
"r_y1": 665.0,
"r_x2": 449.42,
"r_y2": 656.09,
"r_x3": 308.86,
"r_y3": 656.09,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."
},
{
"label": "text",
"id": 7,
"page_no": 3,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.26,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.22,
"r_x1": 431.91,
"r_y1": 677.22,
"r_x2": 431.91,
"r_y2": 668.26,
"r_x3": 320.82,
"r_y3": 668.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 439.5,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.11,
"r_y1": 689.24,
"r_x2": 545.11,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"
},
{
"label": "page_footer",
"id": 14,
"page_no": 3,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4"
}
],
"body": [
{
"label": "text",
"id": 10,
"page_no": 3,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 96.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 212.28,
"r_y1": 96.07,
"r_x2": 212.28,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."
},
{
"label": "text",
"id": 1,
"page_no": 3,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 100.96,
"r": 286.37,
"b": 313.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 109.87,
"r_x1": 286.37,
"r_y1": 109.87,
"r_x2": 286.37,
"r_y2": 100.96,
"r_x3": 62.07,
"r_y3": 100.96,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 121.82,
"r_x1": 286.37,
"r_y1": 121.82,
"r_x2": 286.37,
"r_y2": 112.92,
"r_x3": 50.11,
"r_y3": 112.92,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 133.78,
"r_x1": 286.37,
"r_y1": 133.78,
"r_x2": 286.37,
"r_y2": 124.87,
"r_x3": 50.11,
"r_y3": 124.87,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 145.73,
"r_x1": 286.37,
"r_y1": 145.73,
"r_x2": 286.37,
"r_y2": 136.83,
"r_x3": 50.11,
"r_y3": 136.83,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 157.69,
"r_x1": 286.37,
"r_y1": 157.69,
"r_x2": 286.37,
"r_y2": 148.78,
"r_x3": 50.11,
"r_y3": 148.78,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 169.64,
"r_x1": 286.37,
"r_y1": 169.64,
"r_x2": 286.37,
"r_y2": 160.74,
"r_x3": 50.11,
"r_y3": 160.74,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 181.6,
"r_x1": 286.37,
"r_y1": 181.6,
"r_x2": 286.37,
"r_y2": 172.69,
"r_x3": 50.11,
"r_y3": 172.69,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 193.55,
"r_x1": 286.37,
"r_y1": 193.55,
"r_x2": 286.37,
"r_y2": 184.65,
"r_x3": 50.11,
"r_y3": 184.65,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 205.51,
"r_x1": 286.37,
"r_y1": 205.51,
"r_x2": 286.37,
"r_y2": 196.6,
"r_x3": 50.11,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 217.46,
"r_x1": 286.37,
"r_y1": 217.46,
"r_x2": 286.37,
"r_y2": 208.56,
"r_x3": 50.11,
"r_y3": 208.56,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 229.42,
"r_x1": 286.37,
"r_y1": 229.42,
"r_x2": 286.37,
"r_y2": 220.51,
"r_x3": 50.11,
"r_y3": 220.51,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 241.37,
"r_x1": 286.37,
"r_y1": 241.37,
"r_x2": 286.37,
"r_y2": 232.47,
"r_x3": 50.11,
"r_y3": 232.47,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 253.33,
"r_x1": 286.37,
"r_y1": 253.33,
"r_x2": 286.37,
"r_y2": 244.42,
"r_x3": 50.11,
"r_y3": 244.42,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 265.28,
"r_x1": 286.37,
"r_y1": 265.28,
"r_x2": 286.37,
"r_y2": 256.38,
"r_x3": 50.11,
"r_y3": 256.38,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 277.24,
"r_x1": 286.37,
"r_y1": 277.24,
"r_x2": 286.37,
"r_y2": 268.33,
"r_x3": 50.11,
"r_y3": 268.33,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 289.2,
"r_x1": 68.65,
"r_y1": 289.2,
"r_x2": 68.65,
"r_y2": 280.29,
"r_x3": 50.11,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.57,
"r_y0": 289.2,
"r_x1": 286.37,
"r_y1": 289.2,
"r_x2": 286.37,
"r_y2": 280.29,
"r_x3": 75.57,
"r_y3": 280.29,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 301.15,
"r_x1": 286.37,
"r_y1": 301.15,
"r_x2": 286.37,
"r_y2": 292.24,
"r_x3": 50.11,
"r_y3": 292.24,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 313.11,
"r_x1": 75.7,
"r_y1": 313.11,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.11,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 3,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 318.0,
"r": 286.37,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 326.9,
"r_x1": 286.36,
"r_y1": 326.9,
"r_x2": 286.36,
"r_y2": 318.0,
"r_x3": 62.07,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 338.86,
"r_x1": 286.37,
"r_y1": 338.86,
"r_x2": 286.37,
"r_y2": 329.95,
"r_x3": 50.11,
"r_y3": 329.95,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 350.81,
"r_x1": 286.37,
"r_y1": 350.81,
"r_x2": 286.37,
"r_y2": 341.91,
"r_x3": 50.11,
"r_y3": 341.91,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 362.77,
"r_x1": 286.37,
"r_y1": 362.77,
"r_x2": 286.37,
"r_y2": 353.86,
"r_x3": 50.11,
"r_y3": 353.86,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 374.72,
"r_x1": 286.37,
"r_y1": 374.72,
"r_x2": 286.37,
"r_y2": 365.82,
"r_x3": 50.11,
"r_y3": 365.82,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 386.68,
"r_x1": 141.59,
"r_y1": 386.68,
"r_x2": 141.59,
"r_y2": 377.77,
"r_x3": 50.11,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.68,
"r_x1": 286.37,
"r_y1": 386.68,
"r_x2": 286.37,
"r_y2": 377.77,
"r_x3": 148.7,
"r_y3": 377.77,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 398.63,
"r_x1": 286.37,
"r_y1": 398.63,
"r_x2": 286.37,
"r_y2": 389.73,
"r_x3": 50.11,
"r_y3": 389.73,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 410.59,
"r_x1": 286.37,
"r_y1": 410.59,
"r_x2": 286.37,
"r_y2": 401.68,
"r_x3": 50.11,
"r_y3": 401.68,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 422.54,
"r_x1": 286.37,
"r_y1": 422.54,
"r_x2": 286.37,
"r_y2": 413.64,
"r_x3": 50.11,
"r_y3": 413.64,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.59,
"r_x3": 50.11,
"r_y3": 425.59,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."
},
{
"label": "text",
"id": 3,
"page_no": 3,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 439.39,
"r": 286.37,
"b": 627.62,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 448.3,
"r_x1": 286.36,
"r_y1": 448.3,
"r_x2": 286.36,
"r_y2": 439.39,
"r_x3": 62.07,
"r_y3": 439.39,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.25,
"r_x1": 172.14,
"r_y1": 460.25,
"r_x2": 172.14,
"r_y2": 451.34,
"r_x3": 50.11,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.15,
"r_y0": 460.02,
"r_x1": 224.71,
"r_y1": 460.02,
"r_x2": 224.71,
"r_y2": 451.43,
"r_x3": 174.15,
"r_y3": 451.43,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.71,
"r_y0": 460.25,
"r_x1": 286.37,
"r_y1": 460.25,
"r_x2": 286.37,
"r_y2": 451.34,
"r_x3": 224.71,
"r_y3": 451.34,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.21,
"r_x1": 286.37,
"r_y1": 472.21,
"r_x2": 286.37,
"r_y2": 463.3,
"r_x3": 50.11,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.16,
"r_x1": 286.37,
"r_y1": 484.16,
"r_x2": 286.37,
"r_y2": 475.26,
"r_x3": 50.11,
"r_y3": 475.26,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 496.12,
"r_x1": 286.37,
"r_y1": 496.12,
"r_x2": 286.37,
"r_y2": 487.21,
"r_x3": 50.11,
"r_y3": 487.21,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 508.07,
"r_x1": 286.37,
"r_y1": 508.07,
"r_x2": 286.37,
"r_y2": 499.17,
"r_x3": 50.11,
"r_y3": 499.17,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 520.03,
"r_x1": 286.37,
"r_y1": 520.03,
"r_x2": 286.37,
"r_y2": 511.12,
"r_x3": 50.11,
"r_y3": 511.12,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.98,
"r_x1": 286.37,
"r_y1": 531.98,
"r_x2": 286.37,
"r_y2": 523.08,
"r_x3": 50.11,
"r_y3": 523.08,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.94,
"r_x1": 286.37,
"r_y1": 543.94,
"r_x2": 286.37,
"r_y2": 535.03,
"r_x3": 50.11,
"r_y3": 535.03,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.89,
"r_x1": 286.37,
"r_y1": 555.89,
"r_x2": 286.37,
"r_y2": 546.99,
"r_x3": 50.11,
"r_y3": 546.99,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.85,
"r_x1": 286.37,
"r_y1": 567.85,
"r_x2": 286.37,
"r_y2": 558.94,
"r_x3": 50.11,
"r_y3": 558.94,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.8,
"r_x1": 286.37,
"r_y1": 579.8,
"r_x2": 286.37,
"r_y2": 570.9,
"r_x3": 50.11,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.76,
"r_x1": 286.37,
"r_y1": 591.76,
"r_x2": 286.37,
"r_y2": 582.85,
"r_x3": 50.11,
"r_y3": 582.85,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.71,
"r_x1": 286.37,
"r_y1": 603.71,
"r_x2": 286.37,
"r_y2": 594.81,
"r_x3": 50.11,
"r_y3": 594.81,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.67,
"r_x1": 286.37,
"r_y1": 615.67,
"r_x2": 286.37,
"r_y2": 606.76,
"r_x3": 50.11,
"r_y3": 606.76,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.62,
"r_x1": 209.75,
"r_y1": 627.62,
"r_x2": 209.75,
"r_y2": 618.72,
"r_x3": 50.11,
"r_y3": 618.72,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet. This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."
},
{
"label": "text",
"id": 5,
"page_no": 3,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 632.51,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 641.42,
"r_x1": 286.36,
"r_y1": 641.42,
"r_x2": 286.36,
"r_y2": 632.51,
"r_x3": 62.07,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.43,
"r_x3": 50.11,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"
},
{
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.68,
"t": 73.19,
"r": 542.95,
"b": 155.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "✗",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "✓",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.33,
"r_y0": 82.52,
"r_x1": 430.9,
"r_y1": 82.52,
"r_x2": 430.9,
"r_y2": 73.61,
"r_x3": 412.33,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.86,
"r_y0": 82.52,
"r_x1": 464.45,
"r_y1": 82.52,
"r_x2": 464.45,
"r_y2": 73.61,
"r_x3": 442.86,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.79,
"r_y0": 82.52,
"r_x1": 494.94,
"r_y1": 82.52,
"r_x2": 494.94,
"r_y2": 73.61,
"r_x3": 477.79,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.28,
"r_y0": 82.52,
"r_x1": 536.91,
"r_y1": 82.52,
"r_x2": 536.91,
"r_y2": 73.61,
"r_x3": 508.28,
"r_y3": 73.61,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 94.87,
"r_x1": 361.64,
"r_y1": 94.87,
"r_x2": 361.64,
"r_y2": 85.97,
"r_x3": 317.06,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 94.88,
"r_x1": 425.38,
"r_y1": 94.88,
"r_x2": 425.38,
"r_y2": 85.67,
"r_x3": 417.86,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.88,
"r_x1": 457.42,
"r_y1": 94.88,
"r_x2": 457.42,
"r_y2": 85.67,
"r_x3": 449.9,
"r_y3": 85.67,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.87,
"r_x1": 496.33,
"r_y1": 94.87,
"r_x2": 496.33,
"r_y2": 85.97,
"r_x3": 476.4,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 94.87,
"r_x1": 532.56,
"r_y1": 94.87,
"r_x2": 532.56,
"r_y2": 85.97,
"r_x3": 512.63,
"r_y3": 85.97,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 106.83,
"r_x1": 359.43,
"r_y1": 106.83,
"r_x2": 359.43,
"r_y2": 97.92,
"r_x3": 317.06,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 106.84,
"r_x1": 425.38,
"r_y1": 106.84,
"r_x2": 425.38,
"r_y2": 97.62,
"r_x3": 417.86,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.84,
"r_x1": 457.42,
"r_y1": 106.84,
"r_x2": 457.42,
"r_y2": 97.62,
"r_x3": 449.9,
"r_y3": 97.62,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.83,
"r_x1": 496.33,
"r_y1": 106.83,
"r_x2": 496.33,
"r_y2": 97.92,
"r_x3": 476.4,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.46,
"r_y0": 106.83,
"r_x1": 531.73,
"r_y1": 106.83,
"r_x2": 531.73,
"r_y2": 97.92,
"r_x3": 513.46,
"r_y3": 97.92,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 118.78,
"r_x1": 359.98,
"r_y1": 118.78,
"r_x2": 359.98,
"r_y2": 109.88,
"r_x3": 317.06,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 118.79,
"r_x1": 425.38,
"r_y1": 118.79,
"r_x2": 425.38,
"r_y2": 109.58,
"r_x3": 417.86,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.81,
"r_y0": 118.79,
"r_x1": 456.5,
"r_y1": 118.79,
"r_x2": 456.5,
"r_y2": 109.58,
"r_x3": 450.81,
"r_y3": 109.58,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.78,
"r_x1": 496.33,
"r_y1": 118.78,
"r_x2": 496.33,
"r_y2": 109.88,
"r_x3": 476.4,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.25,
"r_y0": 118.78,
"r_x1": 533.95,
"r_y1": 118.78,
"r_x2": 533.95,
"r_y2": 109.88,
"r_x3": 511.25,
"r_y3": 109.88,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 130.74,
"r_x1": 400.38,
"r_y1": 130.74,
"r_x2": 400.38,
"r_y2": 121.83,
"r_x3": 317.06,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 130.75,
"r_x1": 425.38,
"r_y1": 130.75,
"r_x2": 425.38,
"r_y2": 121.53,
"r_x3": 417.86,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.75,
"r_x1": 457.42,
"r_y1": 130.75,
"r_x2": 457.42,
"r_y2": 121.53,
"r_x3": 449.9,
"r_y3": 121.53,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.74,
"r_x1": 496.33,
"r_y1": 130.74,
"r_x2": 496.33,
"r_y2": 121.83,
"r_x3": 476.4,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 130.74,
"r_x1": 532.56,
"r_y1": 130.74,
"r_x2": 532.56,
"r_y2": 121.83,
"r_x3": 512.63,
"r_y3": 121.83,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 142.69,
"r_x1": 375.17,
"r_y1": 142.69,
"r_x2": 375.17,
"r_y2": 133.79,
"r_x3": 317.06,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 142.7,
"r_x1": 425.38,
"r_y1": 142.7,
"r_x2": 425.38,
"r_y2": 133.49,
"r_x3": 417.86,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.42,
"r_y1": 142.7,
"r_x2": 457.42,
"r_y2": 133.49,
"r_x3": 449.9,
"r_y3": 133.49,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.69,
"r_x1": 496.33,
"r_y1": 142.69,
"r_x2": 496.33,
"r_y2": 133.79,
"r_x3": 476.4,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 142.69,
"r_x1": 532.56,
"r_y1": 142.69,
"r_x2": 532.56,
"r_y2": 133.79,
"r_x3": 512.63,
"r_y3": 133.79,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.06,
"r_y0": 154.65,
"r_x1": 369.39,
"r_y1": 154.65,
"r_x2": 369.39,
"r_y2": 145.74,
"r_x3": 317.06,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.86,
"r_y0": 154.66,
"r_x1": 425.38,
"r_y1": 154.66,
"r_x2": 425.38,
"r_y2": 145.44,
"r_x3": 417.86,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.66,
"r_x1": 457.42,
"r_y1": 154.66,
"r_x2": 457.42,
"r_y2": 145.44,
"r_x3": 449.9,
"r_y3": 145.44,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.65,
"r_x1": 496.33,
"r_y1": 154.65,
"r_x2": 496.33,
"r_y2": 145.74,
"r_x3": 476.4,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.63,
"r_y0": 154.65,
"r_x1": 532.56,
"r_y1": 154.65,
"r_x2": 532.56,
"r_y2": 145.74,
"r_x3": 512.63,
"r_y3": 145.74,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.33,
"t": 73.61,
"r": 430.9,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.86,
"t": 73.61,
"r": 464.45,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.79,
"t": 73.61,
"r": 494.94,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.28,
"t": 73.61,
"r": 536.91,
"b": 82.52,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 85.97,
"r": 361.64,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 85.67,
"r": 425.38,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.67,
"r": 457.42,
"b": 94.88,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 85.97,
"r": 496.33,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 85.97,
"r": 532.56,
"b": 94.87,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 97.92,
"r": 359.43,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 97.62,
"r": 425.38,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.62,
"r": 457.42,
"b": 106.84,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.92,
"r": 496.33,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.46,
"t": 97.92,
"r": 531.73,
"b": 106.83,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 109.88,
"r": 359.98,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 109.58,
"r": 425.38,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.81,
"t": 109.58,
"r": 456.5,
"b": 118.79,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.88,
"r": 496.33,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.25,
"t": 109.88,
"r": 533.95,
"b": 118.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 121.83,
"r": 400.38,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 121.53,
"r": 425.38,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.53,
"r": 457.42,
"b": 130.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.83,
"r": 496.33,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 121.83,
"r": 532.56,
"b": 130.74,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 133.79,
"r": 375.17,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 133.49,
"r": 425.38,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.49,
"r": 457.42,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.79,
"r": 496.33,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 133.79,
"r": 532.56,
"b": 142.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.06,
"t": 145.74,
"r": 369.39,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.86,
"t": 145.44,
"r": 425.38,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.44,
"r": 457.42,
"b": 154.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.74,
"r": 496.33,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.63,
"t": 145.74,
"r": 532.56,
"b": 154.65,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 9,
"page_no": 3,
"cluster": {
"id": 9,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 167.66,
"r": 545.12,
"b": 224.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.967,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 176.57,
"r_x1": 344.62,
"r_y1": 176.57,
"r_x2": 344.62,
"r_y2": 167.66,
"r_x3": 308.86,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.08,
"r_y0": 176.57,
"r_x1": 380.45,
"r_y1": 176.57,
"r_x2": 380.45,
"r_y2": 167.66,
"r_x3": 361.08,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.57,
"r_y0": 176.34,
"r_x1": 468.68,
"r_y1": 176.34,
"r_x2": 468.68,
"r_y2": 167.75,
"r_x3": 386.57,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.57,
"r_x1": 489.18,
"r_y1": 176.57,
"r_x2": 489.18,
"r_y2": 167.66,
"r_x3": 474.8,
"r_y3": 167.66,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.34,
"r_x1": 545.11,
"r_y1": 176.34,
"r_x2": 545.11,
"r_y2": 167.75,
"r_x3": 495.3,
"r_y3": 167.75,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 188.29,
"r_x1": 341.16,
"r_y1": 188.29,
"r_x2": 341.16,
"r_y2": 179.71,
"r_x3": 308.86,
"r_y3": 179.71,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.46,
"r_y0": 188.52,
"r_x1": 545.11,
"r_y1": 188.52,
"r_x2": 545.11,
"r_y2": 179.62,
"r_x3": 343.46,
"r_y3": 179.62,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 200.48,
"r_x1": 545.12,
"r_y1": 200.48,
"r_x2": 545.12,
"r_y2": 191.57,
"r_x3": 308.86,
"r_y3": 191.57,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 212.43,
"r_x1": 545.11,
"r_y1": 212.43,
"r_x2": 545.11,
"r_y2": 203.53,
"r_x3": 308.86,
"r_y3": 203.53,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 224.39,
"r_x1": 523.93,
"r_y1": 224.39,
"r_x2": 523.93,
"r_y2": 215.48,
"r_x3": 308.86,
"r_y3": 215.48,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."
},
{
"label": "text",
"id": 6,
"page_no": 3,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 308.86,
"t": 249.62,
"r": 545.12,
"b": 294.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.53,
"r_x1": 545.12,
"r_y1": 258.53,
"r_x2": 545.12,
"r_y2": 249.62,
"r_x3": 308.86,
"r_y3": 249.62,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.48,
"r_x1": 545.12,
"r_y1": 270.48,
"r_x2": 545.12,
"r_y2": 261.58,
"r_x3": 308.86,
"r_y3": 261.58,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.44,
"r_x1": 545.12,
"r_y1": 282.44,
"r_x2": 545.12,
"r_y2": 273.53,
"r_x3": 308.86,
"r_y3": 273.53,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.39,
"r_x1": 436.82,
"r_y1": 294.39,
"r_x2": 436.82,
"r_y2": 285.49,
"r_x3": 308.86,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."
},
{
"label": "text",
"id": 13,
"page_no": 3,
"cluster": {
"id": 13,
"label": "text",
"bbox": {
"l": 320.82,
"t": 297.77,
"r": 542.74,
"b": 306.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 306.68,
"r_x1": 542.74,
"r_y1": 306.68,
"r_x2": 542.74,
"r_y2": 297.77,
"r_x3": 320.82,
"r_y3": 297.77,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tab. 1 summarizes the various attributes of the datasets."
},
{
"label": "section_header",
"id": 11,
"page_no": 3,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 321.18,
"r": 444.94,
"b": 331.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.947,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 331.93,
"r_x1": 316.28,
"r_y1": 331.93,
"r_x2": 316.28,
"r_y2": 321.18,
"r_x3": 308.86,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.18,
"r_y0": 331.93,
"r_x1": 444.94,
"r_y1": 331.93,
"r_x2": 444.94,
"r_y2": 321.18,
"r_x3": 326.18,
"r_y3": 321.18,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. The TableFormer model"
},
{
"label": "text",
"id": 0,
"page_no": 3,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 341.94,
"r": 545.12,
"b": 446.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 350.85,
"r_x1": 545.11,
"r_y1": 350.85,
"r_x2": 545.11,
"r_y2": 341.94,
"r_x3": 320.82,
"r_y3": 341.94,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 362.8,
"r_x1": 545.12,
"r_y1": 362.8,
"r_x2": 545.12,
"r_y2": 353.89,
"r_x3": 308.86,
"r_y3": 353.89,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 374.76,
"r_x1": 545.12,
"r_y1": 374.76,
"r_x2": 545.12,
"r_y2": 365.85,
"r_x3": 308.86,
"r_y3": 365.85,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 386.71,
"r_x1": 545.12,
"r_y1": 386.71,
"r_x2": 545.12,
"r_y2": 377.8,
"r_x3": 308.86,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 398.67,
"r_x1": 545.12,
"r_y1": 398.67,
"r_x2": 545.12,
"r_y2": 389.76,
"r_x3": 308.86,
"r_y3": 389.76,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 410.62,
"r_x1": 545.12,
"r_y1": 410.62,
"r_x2": 545.12,
"r_y2": 401.71,
"r_x3": 308.86,
"r_y3": 401.71,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 422.58,
"r_x1": 545.12,
"r_y1": 422.58,
"r_x2": 545.12,
"r_y2": 413.67,
"r_x3": 308.86,
"r_y3": 413.67,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 434.53,
"r_x1": 545.12,
"r_y1": 434.53,
"r_x2": 545.12,
"r_y2": 425.63,
"r_x3": 308.86,
"r_y3": 425.63,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 446.49,
"r_x1": 437.94,
"r_y1": 446.49,
"r_x2": 437.94,
"r_y2": 437.58,
"r_x3": 308.86,
"r_y3": 437.58,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."
},
{
"label": "section_header",
"id": 12,
"page_no": 3,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 457.69,
"r": 420.16,
"b": 467.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 467.55,
"r_x1": 323.14,
"r_y1": 467.55,
"r_x2": 323.14,
"r_y2": 457.69,
"r_x3": 308.86,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.66,
"r_y0": 467.55,
"r_x1": 420.16,
"r_y1": 467.55,
"r_x2": 420.16,
"r_y2": 457.69,
"r_x3": 332.66,
"r_y3": 457.69,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4.1. Model architecture."
},
{
"label": "text",
"id": 2,
"page_no": 3,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 476.77,
"r": 545.12,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 485.67,
"r_x1": 545.11,
"r_y1": 485.67,
"r_x2": 545.11,
"r_y2": 476.77,
"r_x3": 320.82,
"r_y3": 476.77,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.63,
"r_x1": 509.02,
"r_y1": 497.63,
"r_x2": 509.02,
"r_y2": 488.72,
"r_x3": 308.86,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.59,
"r_y0": 497.63,
"r_x1": 523.06,
"r_y1": 497.63,
"r_x2": 523.06,
"r_y2": 488.72,
"r_x3": 515.59,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 497.63,
"r_x1": 545.12,
"r_y1": 497.63,
"r_x2": 545.12,
"r_y2": 488.72,
"r_x3": 529.62,
"r_y3": 488.72,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.35,
"r_x1": 406.35,
"r_y1": 509.35,
"r_x2": 406.35,
"r_y2": 500.76,
"r_x3": 308.86,
"r_y3": 500.76,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.87,
"r_y0": 509.58,
"r_x1": 545.11,
"r_y1": 509.58,
"r_x2": 545.11,
"r_y2": 500.68,
"r_x3": 408.87,
"r_y3": 500.68,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.54,
"r_x1": 409.39,
"r_y1": 521.54,
"r_x2": 409.39,
"r_y2": 512.63,
"r_x3": 308.86,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.73,
"r_y0": 521.54,
"r_x1": 545.12,
"r_y1": 521.54,
"r_x2": 545.12,
"r_y2": 512.63,
"r_x3": 416.73,
"r_y3": 512.63,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.49,
"r_x1": 436.19,
"r_y1": 533.49,
"r_x2": 436.19,
"r_y2": 524.59,
"r_x3": 308.86,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.53,
"r_y0": 533.26,
"r_x1": 513.87,
"r_y1": 533.26,
"r_x2": 513.87,
"r_y2": 524.68,
"r_x3": 439.53,
"r_y3": 524.68,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.43,
"r_y0": 533.49,
"r_x1": 545.11,
"r_y1": 533.49,
"r_x2": 545.11,
"r_y2": 524.59,
"r_x3": 517.43,
"r_y3": 524.59,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.45,
"r_x1": 545.12,
"r_y1": 545.45,
"r_x2": 545.12,
"r_y2": 536.54,
"r_x3": 308.86,
"r_y3": 536.54,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.4,
"r_x1": 358.55,
"r_y1": 557.4,
"r_x2": 358.55,
"r_y2": 548.5,
"r_x3": 308.86,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.19,
"r_y0": 557.4,
"r_x1": 545.12,
"r_y1": 557.4,
"r_x2": 545.12,
"r_y2": 548.5,
"r_x3": 365.19,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.36,
"r_x1": 352.41,
"r_y1": 569.36,
"r_x2": 352.41,
"r_y2": 560.45,
"r_x3": 308.86,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.41,
"r_y0": 569.14,
"r_x1": 360.16,
"r_y1": 569.14,
"r_x2": 360.16,
"r_y2": 560.29,
"r_x3": 352.41,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.16,
"r_y0": 569.36,
"r_x1": 367.91,
"r_y1": 569.36,
"r_x2": 367.91,
"r_y2": 560.45,
"r_x3": 360.16,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.91,
"r_y0": 569.14,
"r_x1": 375.66,
"r_y1": 569.14,
"r_x2": 375.66,
"r_y2": 560.29,
"r_x3": 367.91,
"r_y3": 560.29,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.66,
"r_y0": 569.36,
"r_x1": 545.11,
"r_y1": 569.36,
"r_x2": 545.11,
"r_y2": 560.45,
"r_x3": 375.66,
"r_y3": 560.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.31,
"r_x1": 545.11,
"r_y1": 581.31,
"r_x2": 545.11,
"r_y2": 572.41,
"r_x3": 308.86,
"r_y3": 572.41,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.27,
"r_x1": 483.12,
"r_y1": 593.27,
"r_x2": 483.12,
"r_y2": 584.36,
"r_x3": 308.86,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 593.05,
"r_x1": 490.87,
"r_y1": 593.05,
"r_x2": 490.87,
"r_y2": 584.2,
"r_x3": 483.12,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.87,
"r_y0": 593.27,
"r_x1": 545.11,
"r_y1": 593.27,
"r_x2": 545.11,
"r_y2": 584.36,
"r_x3": 490.87,
"r_y3": 584.36,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.22,
"r_x1": 545.11,
"r_y1": 605.22,
"r_x2": 545.11,
"r_y2": 596.32,
"r_x3": 308.86,
"r_y3": 596.32,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.18,
"r_x1": 329.64,
"r_y1": 617.18,
"r_x2": 329.64,
"r_y2": 608.27,
"r_x3": 308.86,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.65,
"r_y0": 616.96,
"r_x1": 337.39,
"r_y1": 616.96,
"r_x2": 337.39,
"r_y2": 608.11,
"r_x3": 329.65,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.39,
"r_y0": 617.18,
"r_x1": 468.59,
"r_y1": 617.18,
"r_x2": 468.59,
"r_y2": 608.27,
"r_x3": 337.39,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.59,
"r_y0": 616.96,
"r_x1": 476.34,
"r_y1": 616.96,
"r_x2": 476.34,
"r_y2": 608.11,
"r_x3": 468.59,
"r_y3": 608.11,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.34,
"r_y0": 617.18,
"r_x1": 545.12,
"r_y1": 617.18,
"r_x2": 545.12,
"r_y2": 608.27,
"r_x3": 476.34,
"r_y3": 608.27,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.13,
"r_x1": 545.11,
"r_y1": 629.13,
"r_x2": 545.11,
"r_y2": 620.23,
"r_x3": 308.86,
"r_y3": 620.23,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.09,
"r_x1": 545.12,
"r_y1": 641.09,
"r_x2": 545.12,
"r_y2": 632.18,
"r_x3": 308.86,
"r_y3": 632.18,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.04,
"r_x1": 545.12,
"r_y1": 653.04,
"r_x2": 545.12,
"r_y2": 644.14,
"r_x3": 308.86,
"r_y3": 644.14,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.0,
"r_x1": 449.42,
"r_y1": 665.0,
"r_x2": 449.42,
"r_y2": 656.09,
"r_x3": 308.86,
"r_y3": 656.09,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."
},
{
"label": "text",
"id": 7,
"page_no": 3,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 668.26,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.979,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 677.22,
"r_x1": 431.91,
"r_y1": 677.22,
"r_x2": 431.91,
"r_y2": 668.26,
"r_x3": 320.82,
"r_y3": 668.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.29,
"r_x1": 545.11,
"r_y1": 677.29,
"r_x2": 545.11,
"r_y2": 668.38,
"r_x3": 439.5,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.11,
"r_y1": 689.24,
"r_x2": 545.11,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 3,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4"
}
]
}
},
{
"page_no": 4,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.69,
"r_y0": 125.63,
"r_x1": 84.93,
"r_y1": 125.63,
"r_x2": 84.93,
"r_y2": 122.44,
"r_x3": 81.69,
"r_y3": 122.44,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.55,
"r_y0": 125.63,
"r_x1": 93.03,
"r_y1": 125.63,
"r_x2": 93.03,
"r_y2": 122.44,
"r_x3": 86.55,
"r_y3": 122.44,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.5,
"r_y0": 118.44,
"r_x1": 115.35,
"r_y1": 118.44,
"r_x2": 115.35,
"r_y2": 115.25,
"r_x3": 102.5,
"r_y3": 115.25,
"coord_origin": "TOPLEFT"
},
"text": "Amount",
"orig": "Amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.14,
"r_y0": 118.4,
"r_x1": 93.29,
"r_y1": 118.4,
"r_x2": 93.29,
"r_y2": 115.21,
"r_x3": 82.14,
"r_y3": 115.21,
"coord_origin": "TOPLEFT"
},
"text": "Names",
"orig": "Names",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.75,
"r_y0": 125.63,
"r_x1": 104.31,
"r_y1": 125.63,
"r_x2": 104.31,
"r_y2": 122.44,
"r_x3": 96.75,
"r_y3": 122.44,
"coord_origin": "TOPLEFT"
},
"text": "1000",
"orig": "1000",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.75,
"r_y0": 130.93,
"r_x1": 102.42,
"r_y1": 130.93,
"r_x2": 102.42,
"r_y2": 127.74,
"r_x3": 96.75,
"r_y3": 127.74,
"coord_origin": "TOPLEFT"
},
"text": "500",
"orig": "500",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.75,
"r_y0": 136.64,
"r_x1": 104.31,
"r_y1": 136.64,
"r_x2": 104.31,
"r_y2": 133.46,
"r_x3": 96.75,
"r_y3": 133.46,
"coord_origin": "TOPLEFT"
},
"text": "3500",
"orig": "3500",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.75,
"r_y0": 142.36,
"r_x1": 102.42,
"r_y1": 142.36,
"r_x2": 102.42,
"r_y2": 139.17,
"r_x3": 96.75,
"r_y3": 139.17,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.66,
"r_y0": 125.63,
"r_x1": 116.14,
"r_y1": 125.63,
"r_x2": 116.14,
"r_y2": 122.44,
"r_x3": 110.66,
"r_y3": 122.44,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.66,
"r_y0": 130.93,
"r_x1": 116.14,
"r_y1": 130.93,
"r_x2": 116.14,
"r_y2": 127.74,
"r_x3": 110.66,
"r_y3": 127.74,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.66,
"r_y0": 136.64,
"r_x1": 116.14,
"r_y1": 136.64,
"r_x2": 116.14,
"r_y2": 133.46,
"r_x3": 110.66,
"r_y3": 133.46,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.66,
"r_y0": 142.36,
"r_x1": 116.14,
"r_y1": 142.36,
"r_x2": 116.14,
"r_y2": 139.17,
"r_x3": 110.66,
"r_y3": 139.17,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.69,
"r_y0": 130.93,
"r_x1": 84.93,
"r_y1": 130.93,
"r_x2": 84.93,
"r_y2": 127.74,
"r_x3": 81.69,
"r_y3": 127.74,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.55,
"r_y0": 130.93,
"r_x1": 93.03,
"r_y1": 130.93,
"r_x2": 93.03,
"r_y2": 127.74,
"r_x3": 86.55,
"r_y3": 127.74,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.69,
"r_y0": 136.64,
"r_x1": 84.93,
"r_y1": 136.64,
"r_x2": 84.93,
"r_y2": 133.46,
"r_x3": 81.69,
"r_y3": 133.46,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.55,
"r_y0": 136.64,
"r_x1": 93.03,
"r_y1": 136.64,
"r_x2": 93.03,
"r_y2": 133.46,
"r_x3": 86.55,
"r_y3": 133.46,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.69,
"r_y0": 142.36,
"r_x1": 84.93,
"r_y1": 142.36,
"r_x2": 84.93,
"r_y2": 139.17,
"r_x3": 81.69,
"r_y3": 139.17,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.55,
"r_y0": 142.36,
"r_x1": 93.03,
"r_y1": 142.36,
"r_x2": 93.03,
"r_y2": 139.17,
"r_x3": 86.55,
"r_y3": 139.17,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.08,
"r_y0": 96.24,
"r_x1": 113.94,
"r_y1": 96.24,
"r_x2": 113.94,
"r_y2": 90.5,
"r_x3": 88.08,
"r_y3": 90.5,
"coord_origin": "TOPLEFT"
},
"text": "Extracted",
"orig": "Extracted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.81,
"r_y0": 103.38,
"r_x1": 119.21,
"r_y1": 103.38,
"r_x2": 119.21,
"r_y2": 97.64,
"r_x3": 82.81,
"r_y3": 97.64,
"coord_origin": "TOPLEFT"
},
"text": "Table Images",
"orig": "Table Images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.94,
"r_y0": 106.34,
"r_x1": 180.01,
"r_y1": 106.34,
"r_x2": 180.01,
"r_y2": 100.6,
"r_x3": 143.94,
"r_y3": 100.6,
"coord_origin": "TOPLEFT"
},
"text": "Standardized",
"orig": "Standardized",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.94,
"r_y0": 113.48,
"r_x1": 172.01,
"r_y1": 113.48,
"r_x2": 172.01,
"r_y2": 107.74,
"r_x3": 151.94,
"r_y3": 107.74,
"coord_origin": "TOPLEFT"
},
"text": "Images",
"orig": "Images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.77,
"r_y0": 86.67,
"r_x1": 266.4,
"r_y1": 86.67,
"r_x2": 266.4,
"r_y2": 80.93,
"r_x3": 251.77,
"r_y3": 80.93,
"coord_origin": "TOPLEFT"
},
"text": "BBox",
"orig": "BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 247.52,
"r_y0": 91.77,
"r_x1": 270.65,
"r_y1": 91.77,
"r_x2": 270.65,
"r_y2": 86.03,
"r_x3": 247.52,
"r_y3": 86.03,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.04,
"r_y0": 84.3,
"r_x1": 352.13,
"r_y1": 84.3,
"r_x2": 352.13,
"r_y2": 78.56,
"r_x3": 331.04,
"r_y3": 78.56,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes",
"orig": "BBoxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 390.56,
"r_y0": 101.77,
"r_x1": 431.73,
"r_y1": 101.77,
"r_x2": 431.73,
"r_y2": 96.03,
"r_x3": 390.56,
"r_y3": 96.03,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes can be",
"orig": "BBoxes can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.82,
"r_y0": 107.89,
"r_x1": 435.47,
"r_y1": 107.89,
"r_x2": 435.47,
"r_y2": 102.15,
"r_x3": 386.82,
"r_y3": 102.15,
"coord_origin": "TOPLEFT"
},
"text": "traced back to the",
"orig": "traced back to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 114.01,
"r_x1": 433.6,
"r_y1": 114.01,
"r_x2": 433.6,
"r_y2": 108.27,
"r_x3": 388.7,
"r_y3": 108.27,
"coord_origin": "TOPLEFT"
},
"text": "original image to",
"orig": "original image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.08,
"r_y0": 120.13,
"r_x1": 431.23,
"r_y1": 120.13,
"r_x2": 431.23,
"r_y2": 114.39,
"r_x3": 391.08,
"r_y3": 114.39,
"coord_origin": "TOPLEFT"
},
"text": "extract content",
"orig": "extract content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.23,
"r_y0": 157.43,
"r_x1": 498.82,
"r_y1": 157.43,
"r_x2": 498.82,
"r_y2": 151.69,
"r_x3": 431.23,
"r_y3": 151.69,
"coord_origin": "TOPLEFT"
},
"text": "Structure Tags sequence",
"orig": "Structure Tags sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.17,
"r_y0": 163.55,
"r_x1": 498.88,
"r_y1": 163.55,
"r_x2": 498.88,
"r_y2": 157.81,
"r_x3": 431.17,
"r_y3": 157.81,
"coord_origin": "TOPLEFT"
},
"text": "provide full description of",
"orig": "provide full description of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.53,
"r_y0": 169.67,
"r_x1": 489.52,
"r_y1": 169.67,
"r_x2": 489.52,
"r_y2": 163.93,
"r_x3": 440.53,
"r_y3": 163.93,
"coord_origin": "TOPLEFT"
},
"text": "the table structure",
"orig": "the table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.37,
"r_y0": 183.99,
"r_x1": 367.72,
"r_y1": 183.99,
"r_x2": 367.72,
"r_y2": 178.25,
"r_x3": 328.37,
"r_y3": 178.25,
"coord_origin": "TOPLEFT"
},
"text": "Structure Tags",
"orig": "Structure Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.84,
"r_y0": 129.65,
"r_x1": 373.68,
"r_y1": 129.65,
"r_x2": 373.68,
"r_y2": 123.91,
"r_x3": 331.84,
"r_y3": 123.91,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes in sync",
"orig": "BBoxes in sync",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.84,
"r_y0": 134.75,
"r_x1": 381.18,
"r_y1": 134.75,
"r_x2": 381.18,
"r_y2": 129.01,
"r_x3": 331.84,
"r_y3": 129.01,
"coord_origin": "TOPLEFT"
},
"text": "with tag sequence",
"orig": "with tag sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.63,
"r_y0": 93.86,
"r_x1": 219.42,
"r_y1": 93.86,
"r_x2": 219.42,
"r_y2": 88.12,
"r_x3": 196.63,
"r_y3": 88.12,
"coord_origin": "TOPLEFT"
},
"text": "Encoder",
"orig": "Encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.67,
"r_y0": 135.24,
"r_x1": 271.5,
"r_y1": 135.24,
"r_x2": 271.5,
"r_y2": 129.49,
"r_x3": 246.67,
"r_y3": 129.49,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 247.52,
"r_y0": 140.34,
"r_x1": 270.65,
"r_y1": 140.34,
"r_x2": 270.65,
"r_y2": 134.59,
"r_x3": 247.52,
"r_y3": 134.59,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.63,
"r_y0": 94.76,
"r_x1": 365.55,
"r_y1": 94.76,
"r_x2": 365.55,
"r_y2": 89.02,
"r_x3": 330.63,
"r_y3": 89.02,
"coord_origin": "TOPLEFT"
},
"text": "[x1, y2, x2, y2]",
"orig": "[x1, y2, x2, y2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.63,
"r_y0": 102.92,
"r_x1": 370.23,
"r_y1": 102.92,
"r_x2": 370.23,
"r_y2": 97.18,
"r_x3": 330.63,
"r_y3": 97.18,
"coord_origin": "TOPLEFT"
},
"text": "[x1', y2', x2', y2']",
"orig": "[x1', y2', x2', y2']",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.63,
"r_y0": 111.08,
"r_x1": 374.51,
"r_y1": 111.08,
"r_x2": 374.51,
"r_y2": 105.34,
"r_x3": 330.63,
"r_y3": 105.34,
"coord_origin": "TOPLEFT"
},
"text": "[x1'', y2'', x2'', y2'']",
"orig": "[x1'', y2'', x2'', y2'']",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.63,
"r_y0": 119.24,
"r_x1": 335.73,
"r_y1": 119.24,
"r_x2": 335.73,
"r_y2": 113.5,
"r_x3": 330.63,
"r_y3": 113.5,
"coord_origin": "TOPLEFT"
},
"text": "...",
"orig": "...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.31,
"r_y0": 146.58,
"r_x1": 335.06,
"r_y1": 146.58,
"r_x2": 335.06,
"r_y2": 141.79,
"r_x3": 322.31,
"r_y3": 141.79,
"coord_origin": "TOPLEFT"
},
"text": "
",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 322.31,
"t": 163.21,
"r": 335.06,
"b": 168.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.31,
"r_y0": 168.0,
"r_x1": 335.06,
"r_y1": 168.0,
"r_x2": 335.06,
"r_y2": 163.21,
"r_x3": 322.31,
"r_y3": 163.21,
"coord_origin": "TOPLEFT"
},
"text": "",
"orig": " | ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 343.56,
"t": 163.21,
"r": 374.74,
"b": 168.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.56,
"r_y0": 168.0,
"r_x1": 374.74,
"r_y1": 168.0,
"r_x2": 374.74,
"r_y2": 163.21,
"r_x3": 343.56,
"r_y3": 163.21,
"coord_origin": "TOPLEFT"
},
"text": " | ...",
"orig": " | ...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 322.31,
"t": 170.35,
"r": 326.56,
"b": 175.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.31,
"r_y0": 175.14,
"r_x1": 326.56,
"r_y1": 175.14,
"r_x2": 326.56,
"r_y2": 170.35,
"r_x3": 322.31,
"r_y3": 170.35,
"coord_origin": "TOPLEFT"
},
"text": "...",
"orig": "...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 323.51,
"t": 89.67,
"r": 326.91,
"b": 95.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.51,
"r_y0": 95.41,
"r_x1": 326.91,
"r_y1": 95.41,
"r_x2": 326.91,
"r_y2": 89.67,
"r_x3": 323.51,
"r_y3": 89.67,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 323.72,
"t": 97.79,
"r": 327.12,
"b": 103.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.72,
"r_y0": 103.53,
"r_x1": 327.12,
"r_y1": 103.53,
"r_x2": 327.12,
"r_y2": 97.79,
"r_x3": 323.72,
"r_y3": 97.79,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 323.72,
"t": 105.99,
"r": 327.12,
"b": 111.73,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.72,
"r_y0": 111.73,
"r_x1": 327.12,
"r_y1": 111.73,
"r_x2": 327.12,
"r_y2": 105.99,
"r_x3": 323.72,
"r_y3": 105.99,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 401.48,
"t": 148.55,
"r": 404.88,
"b": 154.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.48,
"r_y0": 154.29,
"r_x1": 404.88,
"r_y1": 154.29,
"r_x2": 404.88,
"r_y2": 148.55,
"r_x3": 401.48,
"r_y3": 148.55,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 337.7,
"t": 162.68,
"r": 341.1,
"b": 168.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.7,
"r_y0": 168.43,
"r_x1": 341.1,
"r_y1": 168.43,
"r_x2": 341.1,
"r_y2": 162.68,
"r_x3": 337.7,
"r_y3": 162.68,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 454.46,
"t": 104.55,
"r": 457.87,
"b": 110.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.46,
"r_y0": 110.29,
"r_x1": 457.87,
"r_y1": 110.29,
"r_x2": 457.87,
"r_y2": 104.55,
"r_x3": 454.46,
"r_y3": 104.55,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 493.33,
"t": 91.1,
"r": 496.73,
"b": 96.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.33,
"r_y0": 96.84,
"r_x1": 496.73,
"r_y1": 96.84,
"r_x2": 496.73,
"r_y2": 91.1,
"r_x3": 493.33,
"r_y3": 91.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 454.08,
"t": 90.57,
"r": 457.49,
"b": 96.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.08,
"r_y0": 96.31,
"r_x1": 457.49,
"r_y1": 96.31,
"r_x2": 457.49,
"r_y2": 90.57,
"r_x3": 454.08,
"r_y3": 90.57,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 6,
"page_no": 4,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 203.99,
"r": 545.11,
"b": 224.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.968,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 213.01,
"r_x1": 86.88,
"r_y1": 213.01,
"r_x2": 86.88,
"r_y2": 204.11,
"r_x3": 50.11,
"r_y3": 204.11,
"coord_origin": "TOPLEFT"
},
"text": "Figure 3:",
"orig": "Figure 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.02,
"r_y0": 212.94,
"r_x1": 149.85,
"r_y1": 212.94,
"r_x2": 149.85,
"r_y2": 203.99,
"r_x3": 94.02,
"r_y3": 203.99,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.86,
"r_y0": 213.01,
"r_x1": 545.11,
"r_y1": 213.01,
"r_x2": 545.11,
"r_y2": 204.11,
"r_x3": 152.86,
"r_y3": 204.11,
"coord_origin": "TOPLEFT"
},
"text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are",
"orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 224.97,
"r_x1": 436.01,
"r_y1": 224.97,
"r_x2": 436.01,
"r_y2": 216.06,
"r_x3": 50.11,
"r_y3": 216.06,
"coord_origin": "TOPLEFT"
},
"text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.",
"orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure."
},
{
"label": "picture",
"id": 5,
"page_no": 4,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 53.03,
"t": 257.67,
"r": 285.37,
"b": 507.67,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.25,
"r_y0": 264.17,
"r_x1": 101.76,
"r_y1": 264.17,
"r_x2": 101.76,
"r_y2": 258.21,
"r_x3": 74.25,
"r_y3": 258.21,
"coord_origin": "TOPLEFT"
},
"text": "Input Image",
"orig": "Input Image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.3,
"r_y0": 264.31,
"r_x1": 157.84,
"r_y1": 264.31,
"r_x2": 157.84,
"r_y2": 258.35,
"r_x3": 122.3,
"r_y3": 258.35,
"coord_origin": "TOPLEFT"
},
"text": "Tokenised Tags",
"orig": "Tokenised Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.55,
"r_y0": 377.05,
"r_x1": 125.68,
"r_y1": 377.05,
"r_x2": 125.68,
"r_y2": 371.39,
"r_x3": 78.55,
"r_y3": 371.39,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.51,
"r_y0": 396.98,
"r_x1": 84.64,
"r_y1": 396.98,
"r_x2": 84.64,
"r_y2": 391.32,
"r_x3": 78.51,
"r_y3": 391.32,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.53,
"r_y0": 396.98,
"r_x1": 125.11,
"r_y1": 396.98,
"r_x2": 125.11,
"r_y2": 391.32,
"r_x3": 116.53,
"r_y3": 391.32,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.02,
"r_y0": 430.12,
"r_x1": 127.92,
"r_y1": 430.12,
"r_x2": 127.92,
"r_y2": 424.45,
"r_x3": 76.02,
"r_y3": 424.45,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.38,
"r_y0": 450.55,
"r_x1": 84.51,
"r_y1": 450.55,
"r_x2": 84.51,
"r_y2": 444.89,
"r_x3": 78.38,
"r_y3": 444.89,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.4,
"r_y0": 450.55,
"r_x1": 124.98,
"r_y1": 450.55,
"r_x2": 124.98,
"r_y2": 444.89,
"r_x3": 116.4,
"r_y3": 444.89,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 167.47,
"r_y0": 468.11,
"r_x1": 181.63,
"r_y1": 468.11,
"r_x2": 181.63,
"r_y2": 462.44,
"r_x3": 167.47,
"r_y3": 462.44,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 165.61,
"r_y0": 484.13,
"r_x1": 184.43,
"r_y1": 484.13,
"r_x2": 184.43,
"r_y2": 478.47,
"r_x3": 165.61,
"r_y3": 478.47,
"coord_origin": "TOPLEFT"
},
"text": "Softmax",
"orig": "Softmax",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.32,
"r_y0": 330.22,
"r_x1": 132.92,
"r_y1": 330.22,
"r_x2": 132.92,
"r_y2": 324.26,
"r_x3": 65.32,
"r_y3": 324.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN BACKBONE ENCODER",
"orig": "CNN BACKBONE ENCODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.51,
"r_y0": 274.73,
"r_x1": 162.99,
"r_y1": 274.73,
"r_x2": 162.99,
"r_y2": 269.66,
"r_x3": 119.51,
"r_y3": 269.66,
"coord_origin": "TOPLEFT"
},
"text": "[30, 1, 2, 3, 4, \u2026 3, ",
"orig": "[30, 1, 2, 3, 4, \u2026 3, ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.73,
"r_y0": 279.98,
"r_x1": 151.41,
"r_y1": 279.98,
"r_x2": 151.41,
"r_y2": 274.91,
"r_x3": 128.73,
"r_y3": 274.91,
"coord_origin": "TOPLEFT"
},
"text": "4, 5, 8, 31]",
"orig": "4, 5, 8, 31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.43,
"r_y0": 344.27,
"r_x1": 80.27,
"r_y1": 344.27,
"r_x2": 80.27,
"r_y2": 338.96,
"r_x3": 60.43,
"r_y3": 338.96,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.6,
"r_y0": 348.7,
"r_x1": 78.85,
"r_y1": 348.7,
"r_x2": 78.85,
"r_y2": 343.39,
"r_x3": 60.6,
"r_y3": 343.39,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.83,
"r_y0": 298.69,
"r_x1": 154.66,
"r_y1": 298.69,
"r_x2": 154.66,
"r_y2": 293.38,
"r_x3": 134.83,
"r_y3": 293.38,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.99,
"r_y0": 303.11,
"r_x1": 153.25,
"r_y1": 303.11,
"r_x2": 153.25,
"r_y2": 297.8,
"r_x3": 134.99,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 351.02,
"r_x1": 197.15,
"r_y1": 351.02,
"r_x2": 197.15,
"r_y2": 345.36,
"r_x3": 150.55,
"r_y3": 345.36,
"coord_origin": "TOPLEFT"
},
"text": "Add & Normalisation",
"orig": "Add & Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 400.09,
"r_x1": 156.68,
"r_y1": 400.09,
"r_x2": 156.68,
"r_y2": 394.42,
"r_x3": 150.55,
"r_y3": 394.42,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.57,
"r_y0": 400.09,
"r_x1": 197.15,
"r_y1": 400.09,
"r_x2": 197.15,
"r_y2": 394.42,
"r_x3": 188.57,
"r_y3": 394.42,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.19,
"r_y0": 381.33,
"r_x1": 197.32,
"r_y1": 381.33,
"r_x2": 197.32,
"r_y2": 375.67,
"r_x3": 150.19,
"r_y3": 375.67,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 445.91,
"r_x1": 156.68,
"r_y1": 445.91,
"r_x2": 156.68,
"r_y2": 440.25,
"r_x3": 150.55,
"r_y3": 440.25,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.57,
"r_y0": 445.91,
"r_x1": 197.15,
"r_y1": 445.91,
"r_x2": 197.15,
"r_y2": 440.25,
"r_x3": 188.57,
"r_y3": 440.25,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.86,
"r_y0": 427.76,
"r_x1": 199.76,
"r_y1": 427.76,
"r_x2": 199.76,
"r_y2": 422.09,
"r_x3": 147.86,
"r_y3": 422.09,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.57,
"r_y0": 319.92,
"r_x1": 255.73,
"r_y1": 319.92,
"r_x2": 255.73,
"r_y2": 314.26,
"r_x3": 241.57,
"r_y3": 314.26,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.92,
"r_y0": 367.03,
"r_x1": 256.08,
"r_y1": 367.03,
"r_x2": 256.08,
"r_y2": 361.36,
"r_x3": 241.92,
"r_y3": 361.36,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.05,
"r_y0": 342.28,
"r_x1": 248.72,
"r_y1": 342.28,
"r_x2": 248.72,
"r_y2": 336.62,
"r_x3": 228.05,
"r_y3": 336.62,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 342.28,
"r_x1": 269.39,
"r_y1": 342.28,
"r_x2": 269.39,
"r_y2": 336.62,
"r_x3": 246.29,
"r_y3": 336.62,
"coord_origin": "TOPLEFT"
},
"text": "Network",
"orig": "Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.45,
"r_y0": 410.81,
"r_x1": 238.74,
"r_y1": 410.81,
"r_x2": 238.74,
"r_y2": 405.15,
"r_x3": 228.45,
"r_y3": 405.15,
"coord_origin": "TOPLEFT"
},
"text": "MLP",
"orig": "MLP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.3,
"r_y0": 410.87,
"r_x1": 271.78,
"r_y1": 410.87,
"r_x2": 271.78,
"r_y2": 405.2,
"r_x3": 256.3,
"r_y3": 405.2,
"coord_origin": "TOPLEFT"
},
"text": "Linear ",
"orig": "Linear ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.55,
"r_y0": 387.88,
"r_x1": 258.09,
"r_y1": 387.88,
"r_x2": 258.09,
"r_y2": 382.21,
"r_x3": 239.55,
"r_y3": 382.21,
"coord_origin": "TOPLEFT"
},
"text": "Sigmoid",
"orig": "Sigmoid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.15,
"r_y0": 449.78,
"r_x1": 59.51,
"r_y1": 449.78,
"r_x2": 59.51,
"r_y2": 384.87,
"r_x3": 54.15,
"r_y3": 384.87,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Encoder Network",
"orig": "Transformer Encoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.24,
"r_y0": 378.45,
"r_x1": 59.3,
"r_y1": 378.45,
"r_x2": 59.3,
"r_y2": 373.81,
"r_x3": 54.24,
"r_y3": 373.81,
"coord_origin": "TOPLEFT"
},
"text": "x2",
"orig": "x2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.3,
"r_y0": 490.37,
"r_x1": 122.16,
"r_y1": 490.37,
"r_x2": 122.16,
"r_y2": 484.53,
"r_x3": 85.3,
"r_y3": 484.53,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.67,
"r_y0": 285.46,
"r_x1": 265.32,
"r_y1": 285.46,
"r_x2": 265.32,
"r_y2": 279.55,
"r_x3": 229.67,
"r_y3": 279.55,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.17,
"r_y0": 506.13,
"r_x1": 190.42,
"r_y1": 506.13,
"r_x2": 190.42,
"r_y2": 500.3,
"r_x3": 157.17,
"r_y3": 500.3,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Tags",
"orig": "Predicted Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.82,
"r_y0": 443.89,
"r_x1": 270.78,
"r_y1": 443.89,
"r_x2": 270.78,
"r_y2": 438.06,
"r_x3": 227.82,
"r_y3": 438.06,
"coord_origin": "TOPLEFT"
},
"text": "Bounding Boxes & ",
"orig": "Bounding Boxes & ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.7,
"r_y0": 449.89,
"r_x1": 263.51,
"r_y1": 449.89,
"r_x2": 263.51,
"r_y2": 444.06,
"r_x3": 233.7,
"r_y3": 444.06,
"coord_origin": "TOPLEFT"
},
"text": "Classification",
"orig": "Classification",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.75,
"r_y0": 298.76,
"r_x1": 212.16,
"r_y1": 298.76,
"r_x2": 212.16,
"r_y2": 293.4,
"r_x3": 184.75,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Transformer ",
"orig": "Transformer ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.91,
"r_y0": 304.51,
"r_x1": 216.74,
"r_y1": 304.51,
"r_x2": 216.74,
"r_y2": 299.15,
"r_x3": 178.91,
"r_y3": 299.15,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Network",
"orig": "Decoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.25,
"r_y0": 287.85,
"r_x1": 198.89,
"r_y1": 287.85,
"r_x2": 198.89,
"r_y2": 282.78,
"r_x3": 194.25,
"r_y3": 282.78,
"coord_origin": "TOPLEFT"
},
"text": "x4",
"orig": "x4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.46,
"r_y0": 277.83,
"r_x1": 276.47,
"r_y1": 277.83,
"r_x2": 276.47,
"r_y2": 271.87,
"r_x3": 221.46,
"r_y3": 271.87,
"coord_origin": "TOPLEFT"
},
"text": "CELL BBOX DECODER",
"orig": "CELL BBOX DECODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.65,
"r_y0": 329.1,
"r_x1": 197.29,
"r_y1": 329.1,
"r_x2": 197.29,
"r_y2": 323.44,
"r_x3": 151.65,
"r_y3": 323.44,
"coord_origin": "TOPLEFT"
},
"text": "Masked Multi-Head ",
"orig": "Masked Multi-Head ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 163.43,
"r_y0": 335.1,
"r_x1": 184.19,
"r_y1": 335.1,
"r_x2": 184.19,
"r_y2": 329.44,
"r_x3": 163.43,
"r_y3": 329.44,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 70,
"label": "text",
"bbox": {
"l": 74.25,
"t": 258.21,
"r": 101.76,
"b": 264.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.25,
"r_y0": 264.17,
"r_x1": 101.76,
"r_y1": 264.17,
"r_x2": 101.76,
"r_y2": 258.21,
"r_x3": 74.25,
"r_y3": 258.21,
"coord_origin": "TOPLEFT"
},
"text": "Input Image",
"orig": "Input Image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 122.3,
"t": 258.35,
"r": 157.84,
"b": 264.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.3,
"r_y0": 264.31,
"r_x1": 157.84,
"r_y1": 264.31,
"r_x2": 157.84,
"r_y2": 258.35,
"r_x3": 122.3,
"r_y3": 258.35,
"coord_origin": "TOPLEFT"
},
"text": "Tokenised Tags",
"orig": "Tokenised Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 78.55,
"t": 371.39,
"r": 125.68,
"b": 377.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.55,
"r_y0": 377.05,
"r_x1": 125.68,
"r_y1": 377.05,
"r_x2": 125.68,
"r_y2": 371.39,
"r_x3": 78.55,
"r_y3": 371.39,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 78.51,
"t": 391.32,
"r": 84.64,
"b": 396.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.51,
"r_y0": 396.98,
"r_x1": 84.64,
"r_y1": 396.98,
"r_x2": 84.64,
"r_y2": 391.32,
"r_x3": 78.51,
"r_y3": 391.32,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 116.53,
"t": 391.32,
"r": 125.11,
"b": 396.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.53,
"r_y0": 396.98,
"r_x1": 125.11,
"r_y1": 396.98,
"r_x2": 125.11,
"r_y2": 391.32,
"r_x3": 116.53,
"r_y3": 391.32,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 76.02,
"t": 424.45,
"r": 127.92,
"b": 430.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.02,
"r_y0": 430.12,
"r_x1": 127.92,
"r_y1": 430.12,
"r_x2": 127.92,
"r_y2": 424.45,
"r_x3": 76.02,
"r_y3": 424.45,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 78.38,
"t": 444.89,
"r": 84.51,
"b": 450.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.38,
"r_y0": 450.55,
"r_x1": 84.51,
"r_y1": 450.55,
"r_x2": 84.51,
"r_y2": 444.89,
"r_x3": 78.38,
"r_y3": 444.89,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 116.4,
"t": 444.89,
"r": 124.98,
"b": 450.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.4,
"r_y0": 450.55,
"r_x1": 124.98,
"r_y1": 450.55,
"r_x2": 124.98,
"r_y2": 444.89,
"r_x3": 116.4,
"r_y3": 444.89,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 167.47,
"t": 462.44,
"r": 181.63,
"b": 468.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 167.47,
"r_y0": 468.11,
"r_x1": 181.63,
"r_y1": 468.11,
"r_x2": 181.63,
"r_y2": 462.44,
"r_x3": 167.47,
"r_y3": 462.44,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 165.61,
"t": 478.47,
"r": 184.43,
"b": 484.13,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 165.61,
"r_y0": 484.13,
"r_x1": 184.43,
"r_y1": 484.13,
"r_x2": 184.43,
"r_y2": 478.47,
"r_x3": 165.61,
"r_y3": 478.47,
"coord_origin": "TOPLEFT"
},
"text": "Softmax",
"orig": "Softmax",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 65.32,
"t": 324.26,
"r": 132.92,
"b": 330.22,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.32,
"r_y0": 330.22,
"r_x1": 132.92,
"r_y1": 330.22,
"r_x2": 132.92,
"r_y2": 324.26,
"r_x3": 65.32,
"r_y3": 324.26,
"coord_origin": "TOPLEFT"
},
"text": "CNN BACKBONE ENCODER",
"orig": "CNN BACKBONE ENCODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 119.51,
"t": 269.66,
"r": 162.99,
"b": 274.73,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.51,
"r_y0": 274.73,
"r_x1": 162.99,
"r_y1": 274.73,
"r_x2": 162.99,
"r_y2": 269.66,
"r_x3": 119.51,
"r_y3": 269.66,
"coord_origin": "TOPLEFT"
},
"text": "[30, 1, 2, 3, 4, \u2026 3, ",
"orig": "[30, 1, 2, 3, 4, \u2026 3, ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 128.73,
"t": 274.91,
"r": 151.41,
"b": 279.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.73,
"r_y0": 279.98,
"r_x1": 151.41,
"r_y1": 279.98,
"r_x2": 151.41,
"r_y2": 274.91,
"r_x3": 128.73,
"r_y3": 274.91,
"coord_origin": "TOPLEFT"
},
"text": "4, 5, 8, 31]",
"orig": "4, 5, 8, 31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 60.43,
"t": 338.96,
"r": 80.27,
"b": 344.27,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.43,
"r_y0": 344.27,
"r_x1": 80.27,
"r_y1": 344.27,
"r_x2": 80.27,
"r_y2": 338.96,
"r_x3": 60.43,
"r_y3": 338.96,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 60.6,
"t": 343.39,
"r": 78.85,
"b": 348.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.6,
"r_y0": 348.7,
"r_x1": 78.85,
"r_y1": 348.7,
"r_x2": 78.85,
"r_y2": 343.39,
"r_x3": 60.6,
"r_y3": 343.39,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 134.83,
"t": 293.38,
"r": 154.66,
"b": 298.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.83,
"r_y0": 298.69,
"r_x1": 154.66,
"r_y1": 298.69,
"r_x2": 154.66,
"r_y2": 293.38,
"r_x3": 134.83,
"r_y3": 293.38,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 134.99,
"t": 297.8,
"r": 153.25,
"b": 303.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.99,
"r_y0": 303.11,
"r_x1": 153.25,
"r_y1": 303.11,
"r_x2": 153.25,
"r_y2": 297.8,
"r_x3": 134.99,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 150.55,
"t": 345.36,
"r": 197.15,
"b": 351.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 351.02,
"r_x1": 197.15,
"r_y1": 351.02,
"r_x2": 197.15,
"r_y2": 345.36,
"r_x3": 150.55,
"r_y3": 345.36,
"coord_origin": "TOPLEFT"
},
"text": "Add & Normalisation",
"orig": "Add & Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 150.55,
"t": 394.42,
"r": 156.68,
"b": 400.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 400.09,
"r_x1": 156.68,
"r_y1": 400.09,
"r_x2": 156.68,
"r_y2": 394.42,
"r_x3": 150.55,
"r_y3": 394.42,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 188.57,
"t": 394.42,
"r": 197.15,
"b": 400.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.57,
"r_y0": 400.09,
"r_x1": 197.15,
"r_y1": 400.09,
"r_x2": 197.15,
"r_y2": 394.42,
"r_x3": 188.57,
"r_y3": 394.42,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 150.19,
"t": 375.67,
"r": 197.32,
"b": 381.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.19,
"r_y0": 381.33,
"r_x1": 197.32,
"r_y1": 381.33,
"r_x2": 197.32,
"r_y2": 375.67,
"r_x3": 150.19,
"r_y3": 375.67,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 150.55,
"t": 440.25,
"r": 156.68,
"b": 445.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.55,
"r_y0": 445.91,
"r_x1": 156.68,
"r_y1": 445.91,
"r_x2": 156.68,
"r_y2": 440.25,
"r_x3": 150.55,
"r_y3": 440.25,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 188.57,
"t": 440.25,
"r": 197.15,
"b": 445.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.57,
"r_y0": 445.91,
"r_x1": 197.15,
"r_y1": 445.91,
"r_x2": 197.15,
"r_y2": 440.25,
"r_x3": 188.57,
"r_y3": 440.25,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 147.86,
"t": 422.09,
"r": 199.76,
"b": 427.76,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.86,
"r_y0": 427.76,
"r_x1": 199.76,
"r_y1": 427.76,
"r_x2": 199.76,
"r_y2": 422.09,
"r_x3": 147.86,
"r_y3": 422.09,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 241.57,
"t": 314.26,
"r": 255.73,
"b": 319.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.57,
"r_y0": 319.92,
"r_x1": 255.73,
"r_y1": 319.92,
"r_x2": 255.73,
"r_y2": 314.26,
"r_x3": 241.57,
"r_y3": 314.26,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 241.92,
"t": 361.36,
"r": 256.08,
"b": 367.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.92,
"r_y0": 367.03,
"r_x1": 256.08,
"r_y1": 367.03,
"r_x2": 256.08,
"r_y2": 361.36,
"r_x3": 241.92,
"r_y3": 361.36,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 228.05,
"t": 336.62,
"r": 248.72,
"b": 342.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.05,
"r_y0": 342.28,
"r_x1": 248.72,
"r_y1": 342.28,
"r_x2": 248.72,
"r_y2": 336.62,
"r_x3": 228.05,
"r_y3": 336.62,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 246.29,
"t": 336.62,
"r": 269.39,
"b": 342.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 342.28,
"r_x1": 269.39,
"r_y1": 342.28,
"r_x2": 269.39,
"r_y2": 336.62,
"r_x3": 246.29,
"r_y3": 336.62,
"coord_origin": "TOPLEFT"
},
"text": "Network",
"orig": "Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 228.45,
"t": 405.15,
"r": 238.74,
"b": 410.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.45,
"r_y0": 410.81,
"r_x1": 238.74,
"r_y1": 410.81,
"r_x2": 238.74,
"r_y2": 405.15,
"r_x3": 228.45,
"r_y3": 405.15,
"coord_origin": "TOPLEFT"
},
"text": "MLP",
"orig": "MLP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 256.3,
"t": 405.2,
"r": 271.78,
"b": 410.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.3,
"r_y0": 410.87,
"r_x1": 271.78,
"r_y1": 410.87,
"r_x2": 271.78,
"r_y2": 405.2,
"r_x3": 256.3,
"r_y3": 405.2,
"coord_origin": "TOPLEFT"
},
"text": "Linear ",
"orig": "Linear ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 239.55,
"t": 382.21,
"r": 258.09,
"b": 387.88,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.55,
"r_y0": 387.88,
"r_x1": 258.09,
"r_y1": 387.88,
"r_x2": 258.09,
"r_y2": 382.21,
"r_x3": 239.55,
"r_y3": 382.21,
"coord_origin": "TOPLEFT"
},
"text": "Sigmoid",
"orig": "Sigmoid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 54.15,
"t": 384.87,
"r": 59.51,
"b": 449.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.15,
"r_y0": 449.78,
"r_x1": 59.51,
"r_y1": 449.78,
"r_x2": 59.51,
"r_y2": 384.87,
"r_x3": 54.15,
"r_y3": 384.87,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Encoder Network",
"orig": "Transformer Encoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 54.24,
"t": 373.81,
"r": 59.3,
"b": 378.45,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.24,
"r_y0": 378.45,
"r_x1": 59.3,
"r_y1": 378.45,
"r_x2": 59.3,
"r_y2": 373.81,
"r_x3": 54.24,
"r_y3": 373.81,
"coord_origin": "TOPLEFT"
},
"text": "x2",
"orig": "x2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 85.3,
"t": 484.53,
"r": 122.16,
"b": 490.37,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.3,
"r_y0": 490.37,
"r_x1": 122.16,
"r_y1": 490.37,
"r_x2": 122.16,
"r_y2": 484.53,
"r_x3": 85.3,
"r_y3": 484.53,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 229.67,
"t": 279.55,
"r": 265.32,
"b": 285.46,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.67,
"r_y0": 285.46,
"r_x1": 265.32,
"r_y1": 285.46,
"r_x2": 265.32,
"r_y2": 279.55,
"r_x3": 229.67,
"r_y3": 279.55,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 157.17,
"t": 500.3,
"r": 190.42,
"b": 506.13,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.17,
"r_y0": 506.13,
"r_x1": 190.42,
"r_y1": 506.13,
"r_x2": 190.42,
"r_y2": 500.3,
"r_x3": 157.17,
"r_y3": 500.3,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Tags",
"orig": "Predicted Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 227.82,
"t": 438.06,
"r": 270.78,
"b": 443.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.82,
"r_y0": 443.89,
"r_x1": 270.78,
"r_y1": 443.89,
"r_x2": 270.78,
"r_y2": 438.06,
"r_x3": 227.82,
"r_y3": 438.06,
"coord_origin": "TOPLEFT"
},
"text": "Bounding Boxes & ",
"orig": "Bounding Boxes & ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 233.7,
"t": 444.06,
"r": 263.51,
"b": 449.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.7,
"r_y0": 449.89,
"r_x1": 263.51,
"r_y1": 449.89,
"r_x2": 263.51,
"r_y2": 444.06,
"r_x3": 233.7,
"r_y3": 444.06,
"coord_origin": "TOPLEFT"
},
"text": "Classification",
"orig": "Classification",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 184.75,
"t": 293.4,
"r": 212.16,
"b": 298.76,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.75,
"r_y0": 298.76,
"r_x1": 212.16,
"r_y1": 298.76,
"r_x2": 212.16,
"r_y2": 293.4,
"r_x3": 184.75,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Transformer ",
"orig": "Transformer ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 178.91,
"t": 299.15,
"r": 216.74,
"b": 304.51,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.91,
"r_y0": 304.51,
"r_x1": 216.74,
"r_y1": 304.51,
"r_x2": 216.74,
"r_y2": 299.15,
"r_x3": 178.91,
"r_y3": 299.15,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Network",
"orig": "Decoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 194.25,
"t": 282.78,
"r": 198.89,
"b": 287.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.25,
"r_y0": 287.85,
"r_x1": 198.89,
"r_y1": 287.85,
"r_x2": 198.89,
"r_y2": 282.78,
"r_x3": 194.25,
"r_y3": 282.78,
"coord_origin": "TOPLEFT"
},
"text": "x4",
"orig": "x4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 221.46,
"t": 271.87,
"r": 276.47,
"b": 277.83,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.46,
"r_y0": 277.83,
"r_x1": 276.47,
"r_y1": 277.83,
"r_x2": 276.47,
"r_y2": 271.87,
"r_x3": 221.46,
"r_y3": 271.87,
"coord_origin": "TOPLEFT"
},
"text": "CELL BBOX DECODER",
"orig": "CELL BBOX DECODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 151.65,
"t": 323.44,
"r": 197.29,
"b": 329.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.65,
"r_y0": 329.1,
"r_x1": 197.29,
"r_y1": 329.1,
"r_x2": 197.29,
"r_y2": 323.44,
"r_x3": 151.65,
"r_y3": 323.44,
"coord_origin": "TOPLEFT"
},
"text": "Masked Multi-Head ",
"orig": "Masked Multi-Head ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 163.43,
"t": 329.44,
"r": 184.19,
"b": 335.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 163.43,
"r_y0": 335.1,
"r_x1": 184.19,
"r_y1": 335.1,
"r_x2": 184.19,
"r_y2": 329.44,
"r_x3": 163.43,
"r_y3": 329.44,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 8,
"page_no": 4,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 527.78,
"r": 286.37,
"b": 680.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.891,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 536.81,
"r_x1": 229.79,
"r_y1": 536.81,
"r_x2": 229.79,
"r_y2": 527.9,
"r_x3": 50.11,
"r_y3": 527.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 4: Given an input image of a table, the",
"orig": "Figure 4: Given an input image of a table, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.79,
"r_y0": 536.74,
"r_x1": 267.76,
"r_y1": 536.74,
"r_x2": 267.76,
"r_y2": 527.78,
"r_x3": 231.79,
"r_y3": 527.78,
"coord_origin": "TOPLEFT"
},
"text": "Encoder",
"orig": "Encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 269.76,
"r_y0": 536.81,
"r_x1": 286.36,
"r_y1": 536.81,
"r_x2": 286.36,
"r_y2": 527.9,
"r_x3": 269.76,
"r_y3": 527.9,
"coord_origin": "TOPLEFT"
},
"text": "pro-",
"orig": "pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 548.76,
"r_x1": 286.37,
"r_y1": 548.76,
"r_x2": 286.37,
"r_y2": 539.86,
"r_x3": 50.11,
"r_y3": 539.86,
"coord_origin": "TOPLEFT"
},
"text": "duces fixed-length features that represent the input image.",
"orig": "duces fixed-length features that represent the input image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 560.72,
"r_x1": 205.85,
"r_y1": 560.72,
"r_x2": 205.85,
"r_y2": 551.81,
"r_x3": 50.11,
"r_y3": 551.81,
"coord_origin": "TOPLEFT"
},
"text": "The features are then passed to both the",
"orig": "The features are then passed to both the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.02,
"r_y0": 560.65,
"r_x1": 286.36,
"r_y1": 560.65,
"r_x2": 286.36,
"r_y2": 551.69,
"r_x3": 208.02,
"r_y3": 551.69,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 572.67,
"r_x1": 64.5,
"r_y1": 572.67,
"r_x2": 64.5,
"r_y2": 563.77,
"r_x3": 50.11,
"r_y3": 563.77,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.17,
"r_y0": 572.61,
"r_x1": 151.31,
"r_y1": 572.61,
"r_x2": 151.31,
"r_y2": 563.65,
"r_x3": 68.17,
"r_y3": 563.65,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.31,
"r_y0": 572.67,
"r_x1": 153.8,
"r_y1": 572.67,
"r_x2": 153.8,
"r_y2": 563.77,
"r_x3": 151.31,
"r_y3": 563.77,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.42,
"r_y0": 572.67,
"r_x1": 241.93,
"r_y1": 572.67,
"r_x2": 241.93,
"r_y2": 563.77,
"r_x3": 160.42,
"r_y3": 563.77,
"coord_origin": "TOPLEFT"
},
"text": "During training, the",
"orig": "During training, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 572.61,
"r_x1": 286.36,
"r_y1": 572.61,
"r_x2": 286.36,
"r_y2": 563.65,
"r_x3": 245.6,
"r_y3": 563.65,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 584.56,
"r_x1": 85.52,
"r_y1": 584.56,
"r_x2": 85.52,
"r_y2": 575.6,
"r_x3": 50.11,
"r_y3": 575.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.62,
"r_y0": 584.63,
"r_x1": 286.36,
"r_y1": 584.63,
"r_x2": 286.36,
"r_y2": 575.72,
"r_x3": 88.62,
"r_y3": 575.72,
"coord_origin": "TOPLEFT"
},
"text": "receives \u2018tokenized tags\u2019 of the HTML code that",
"orig": "receives \u2018tokenized tags\u2019 of the HTML code that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 596.58,
"r_x1": 286.37,
"r_y1": 596.58,
"r_x2": 286.37,
"r_y2": 587.68,
"r_x3": 50.11,
"r_y3": 587.68,
"coord_origin": "TOPLEFT"
},
"text": "represent the table structure. Afterwards, a transformer en-",
"orig": "represent the table structure. Afterwards, a transformer en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 608.54,
"r_x1": 286.37,
"r_y1": 608.54,
"r_x2": 286.37,
"r_y2": 599.63,
"r_x3": 50.11,
"r_y3": 599.63,
"coord_origin": "TOPLEFT"
},
"text": "coder and decoder architecture is employed to produce fea-",
"orig": "coder and decoder architecture is employed to produce fea-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 620.49,
"r_x1": 240.44,
"r_y1": 620.49,
"r_x2": 240.44,
"r_y2": 611.59,
"r_x3": 50.11,
"r_y3": 611.59,
"coord_origin": "TOPLEFT"
},
"text": "tures that are received by a linear layer, and the",
"orig": "tures that are received by a linear layer, and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.2,
"r_y0": 620.43,
"r_x1": 286.37,
"r_y1": 620.43,
"r_x2": 286.37,
"r_y2": 611.47,
"r_x3": 243.2,
"r_y3": 611.47,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 632.38,
"r_x1": 286.37,
"r_y1": 632.38,
"r_x2": 286.37,
"r_y2": 623.42,
"r_x3": 50.11,
"r_y3": 623.42,
"coord_origin": "TOPLEFT"
},
"text": "Decoder. The linear layer is applied to the features to",
"orig": "Decoder. The linear layer is applied to the features to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 644.34,
"r_x1": 286.37,
"r_y1": 644.34,
"r_x2": 286.37,
"r_y2": 635.38,
"r_x3": 50.11,
"r_y3": 635.38,
"coord_origin": "TOPLEFT"
},
"text": "predict the tags. Simultaneously, the Cell BBox Decoder",
"orig": "predict the tags. Simultaneously, the Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 656.36,
"r_x1": 220.58,
"r_y1": 656.36,
"r_x2": 220.58,
"r_y2": 647.45,
"r_x3": 50.11,
"r_y3": 647.45,
"coord_origin": "TOPLEFT"
},
"text": "selects features referring to the data cells (\u2018",
"orig": "selects features referring to the data cells (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.58,
"r_y0": 656.14,
"r_x1": 228.33,
"r_y1": 656.14,
"r_x2": 228.33,
"r_y2": 647.29,
"r_x3": 220.58,
"r_y3": 647.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.33,
"r_y0": 656.36,
"r_x1": 236.08,
"r_y1": 656.36,
"r_x2": 236.08,
"r_y2": 647.45,
"r_x3": 228.33,
"r_y3": 647.45,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.08,
"r_y0": 656.14,
"r_x1": 243.83,
"r_y1": 656.14,
"r_x2": 243.83,
"r_y2": 647.29,
"r_x3": 236.08,
"r_y3": 647.29,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.83,
"r_y0": 656.36,
"r_x1": 255.29,
"r_y1": 656.36,
"r_x2": 255.29,
"r_y2": 647.45,
"r_x3": 243.83,
"r_y3": 647.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018",
"orig": "\u2019, \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.29,
"r_y0": 656.14,
"r_x1": 263.04,
"r_y1": 656.14,
"r_x2": 263.04,
"r_y2": 647.29,
"r_x3": 255.29,
"r_y3": 647.29,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.04,
"r_y0": 656.36,
"r_x1": 286.36,
"r_y1": 656.36,
"r_x2": 286.36,
"r_y2": 647.45,
"r_x3": 263.04,
"r_y3": 647.45,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) and",
"orig": "\u2019) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 668.32,
"r_x1": 286.37,
"r_y1": 668.32,
"r_x2": 286.37,
"r_y2": 659.41,
"r_x3": 50.11,
"r_y3": 659.41,
"coord_origin": "TOPLEFT"
},
"text": "passes them through an attention network, an MLP, and a",
"orig": "passes them through an attention network, an MLP, and a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 680.27,
"r_x1": 218.47,
"r_y1": 680.27,
"r_x2": 218.47,
"r_y2": 671.36,
"r_x3": 50.11,
"r_y3": 671.36,
"coord_origin": "TOPLEFT"
},
"text": "linear layer to predict the bounding boxes.",
"orig": "linear layer to predict the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 4,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 249.53,
"r": 545.12,
"b": 294.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 258.44,
"r_x1": 523.06,
"r_y1": 258.44,
"r_x2": 523.06,
"r_y2": 249.53,
"r_x3": 308.86,
"r_y3": 249.53,
"coord_origin": "TOPLEFT"
},
"text": "forming classification, and adding an adaptive pooling",
"orig": "forming classification, and adding an adaptive pooling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 525.2,
"r_y0": 258.44,
"r_x1": 545.12,
"r_y1": 258.44,
"r_x2": 545.12,
"r_y2": 249.53,
"r_x3": 525.2,
"r_y3": 249.53,
"coord_origin": "TOPLEFT"
},
"text": "layer",
"orig": "layer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 270.4,
"r_x1": 517.56,
"r_y1": 270.4,
"r_x2": 517.56,
"r_y2": 261.49,
"r_x3": 308.86,
"r_y3": 261.49,
"coord_origin": "TOPLEFT"
},
"text": "of size 28*28. ResNet by default downsamples the",
"orig": "of size 28*28. ResNet by default downsamples the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.77,
"r_y0": 270.4,
"r_x1": 545.11,
"r_y1": 270.4,
"r_x2": 545.11,
"r_y2": 261.49,
"r_x3": 520.77,
"r_y3": 261.49,
"coord_origin": "TOPLEFT"
},
"text": "image",
"orig": "image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 282.35,
"r_x1": 534.8,
"r_y1": 282.35,
"r_x2": 534.8,
"r_y2": 273.45,
"r_x3": 308.86,
"r_y3": 273.45,
"coord_origin": "TOPLEFT"
},
"text": "resolution by 32 and then the encoded image is provided",
"orig": "resolution by 32 and then the encoded image is provided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.36,
"r_y0": 282.35,
"r_x1": 545.12,
"r_y1": 282.35,
"r_x2": 545.12,
"r_y2": 273.45,
"r_x3": 537.36,
"r_y3": 273.45,
"coord_origin": "TOPLEFT"
},
"text": "to",
"orig": "to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 294.31,
"r_x1": 341.24,
"r_y1": 294.31,
"r_x2": 341.24,
"r_y2": 285.4,
"r_x3": 308.86,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": "both the",
"orig": "both the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.73,
"r_y0": 294.08,
"r_x1": 417.24,
"r_y1": 294.08,
"r_x2": 417.24,
"r_y2": 285.49,
"r_x3": 343.73,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.23,
"r_y0": 294.31,
"r_x1": 436.6,
"r_y1": 294.31,
"r_x2": 436.6,
"r_y2": 285.4,
"r_x3": 417.23,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.09,
"r_y0": 294.08,
"r_x1": 516.56,
"r_y1": 294.08,
"r_x2": 516.56,
"r_y2": 285.49,
"r_x3": 439.09,
"r_y3": 285.49,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.56,
"r_y0": 294.31,
"r_x1": 519.05,
"r_y1": 294.31,
"r_x2": 519.05,
"r_y2": 285.4,
"r_x3": 516.56,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ."
},
{
"label": "text",
"id": 1,
"page_no": 4,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 297.34,
"r": 545.12,
"b": 413.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 306.3,
"r_x1": 400.87,
"r_y1": 306.3,
"r_x2": 400.87,
"r_y2": 297.34,
"r_x3": 320.82,
"r_y3": 297.34,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder.",
"orig": "Structure Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.91,
"r_y0": 306.37,
"r_x1": 528.34,
"r_y1": 306.37,
"r_x2": 528.34,
"r_y2": 297.46,
"r_x3": 403.91,
"r_y3": 297.46,
"coord_origin": "TOPLEFT"
},
"text": "The transformer architecture of",
"orig": "The transformer architecture of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.72,
"r_y0": 306.37,
"r_x1": 545.11,
"r_y1": 306.37,
"r_x2": 545.11,
"r_y2": 297.46,
"r_x3": 530.72,
"r_y3": 297.46,
"coord_origin": "TOPLEFT"
},
"text": "this",
"orig": "this",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 318.32,
"r_x1": 517.53,
"r_y1": 318.32,
"r_x2": 517.53,
"r_y2": 309.41,
"r_x3": 308.86,
"r_y3": 309.41,
"coord_origin": "TOPLEFT"
},
"text": "component is based on the work proposed in [31].",
"orig": "component is based on the work proposed in [31].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.09,
"r_y0": 318.32,
"r_x1": 545.11,
"r_y1": 318.32,
"r_x2": 545.11,
"r_y2": 309.41,
"r_x3": 524.09,
"r_y3": 309.41,
"coord_origin": "TOPLEFT"
},
"text": "After",
"orig": "After",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 330.28,
"r_x1": 432.36,
"r_y1": 330.28,
"r_x2": 432.36,
"r_y2": 321.37,
"r_x3": 308.86,
"r_y3": 321.37,
"coord_origin": "TOPLEFT"
},
"text": "extensive experimentation, the",
"orig": "extensive experimentation, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.82,
"r_y0": 330.05,
"r_x1": 510.29,
"r_y1": 330.05,
"r_x2": 510.29,
"r_y2": 321.46,
"r_x3": 435.82,
"r_y3": 321.46,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.98,
"r_y0": 330.28,
"r_x1": 520.62,
"r_y1": 330.28,
"r_x2": 520.62,
"r_y2": 321.37,
"r_x3": 513.98,
"r_y3": 321.37,
"coord_origin": "TOPLEFT"
},
"text": "is",
"orig": "is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.08,
"r_y0": 330.28,
"r_x1": 545.11,
"r_y1": 330.28,
"r_x2": 545.11,
"r_y2": 321.37,
"r_x3": 524.08,
"r_y3": 321.37,
"coord_origin": "TOPLEFT"
},
"text": "mod-",
"orig": "mod-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 342.23,
"r_x1": 527.76,
"r_y1": 342.23,
"r_x2": 527.76,
"r_y2": 333.32,
"r_x3": 308.86,
"r_y3": 333.32,
"coord_origin": "TOPLEFT"
},
"text": "eled as a transformer encoder with two encoder layers",
"orig": "eled as a transformer encoder with two encoder layers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.73,
"r_y0": 342.23,
"r_x1": 545.11,
"r_y1": 342.23,
"r_x2": 545.11,
"r_y2": 333.32,
"r_x3": 530.73,
"r_y3": 333.32,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 354.19,
"r_x1": 526.85,
"r_y1": 354.19,
"r_x2": 526.85,
"r_y2": 345.28,
"r_x3": 308.86,
"r_y3": 345.28,
"coord_origin": "TOPLEFT"
},
"text": "a transformer decoder made from a stack of 4 decoder",
"orig": "a transformer decoder made from a stack of 4 decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 354.19,
"r_x1": 545.11,
"r_y1": 354.19,
"r_x2": 545.11,
"r_y2": 345.28,
"r_x3": 529.62,
"r_y3": 345.28,
"coord_origin": "TOPLEFT"
},
"text": "lay-",
"orig": "lay-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 366.14,
"r_x1": 524.51,
"r_y1": 366.14,
"r_x2": 524.51,
"r_y2": 357.24,
"r_x3": 308.86,
"r_y3": 357.24,
"coord_origin": "TOPLEFT"
},
"text": "ers that comprise mainly of multi-head attention and",
"orig": "ers that comprise mainly of multi-head attention and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.97,
"r_y0": 366.14,
"r_x1": 545.12,
"r_y1": 366.14,
"r_x2": 545.12,
"r_y2": 357.24,
"r_x3": 527.97,
"r_y3": 357.24,
"coord_origin": "TOPLEFT"
},
"text": "feed",
"orig": "feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 378.1,
"r_x1": 370.39,
"r_y1": 378.1,
"r_x2": 370.39,
"r_y2": 369.19,
"r_x3": 308.86,
"r_y3": 369.19,
"coord_origin": "TOPLEFT"
},
"text": "forward layers.",
"orig": "forward layers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.44,
"r_y0": 378.1,
"r_x1": 526.91,
"r_y1": 378.1,
"r_x2": 526.91,
"r_y2": 369.19,
"r_x3": 377.44,
"r_y3": 369.19,
"coord_origin": "TOPLEFT"
},
"text": "This configuration uses fewer layers",
"orig": "This configuration uses fewer layers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.73,
"r_y0": 378.1,
"r_x1": 545.12,
"r_y1": 378.1,
"r_x2": 545.12,
"r_y2": 369.19,
"r_x3": 530.73,
"r_y3": 369.19,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 390.05,
"r_x1": 505.46,
"r_y1": 390.05,
"r_x2": 505.46,
"r_y2": 381.15,
"r_x3": 308.86,
"r_y3": 381.15,
"coord_origin": "TOPLEFT"
},
"text": "heads in comparison to networks applied to other",
"orig": "heads in comparison to networks applied to other",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.03,
"r_y0": 390.05,
"r_x1": 545.12,
"r_y1": 390.05,
"r_x2": 545.12,
"r_y2": 381.15,
"r_x3": 508.03,
"r_y3": 381.15,
"coord_origin": "TOPLEFT"
},
"text": "problems",
"orig": "problems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 402.01,
"r_x1": 517.69,
"r_y1": 402.01,
"r_x2": 517.69,
"r_y2": 393.1,
"r_x3": 308.86,
"r_y3": 393.1,
"coord_origin": "TOPLEFT"
},
"text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),",
"orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.77,
"r_y0": 402.01,
"r_x1": 545.11,
"r_y1": 402.01,
"r_x2": 545.11,
"r_y2": 393.1,
"r_x3": 520.77,
"r_y3": 393.1,
"coord_origin": "TOPLEFT"
},
"text": "some-",
"orig": "some-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 413.96,
"r_x1": 528.02,
"r_y1": 413.96,
"r_x2": 528.02,
"r_y2": 405.06,
"r_x3": 308.86,
"r_y3": 405.06,
"coord_origin": "TOPLEFT"
},
"text": "thing which we relate to the simplicity of table images.",
"orig": "thing which we relate to the simplicity of table images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images."
},
{
"label": "text",
"id": 3,
"page_no": 4,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 417.11,
"r": 545.12,
"b": 545.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 426.02,
"r_x1": 515.5,
"r_y1": 426.02,
"r_x2": 515.5,
"r_y2": 417.11,
"r_x3": 320.82,
"r_y3": 417.11,
"coord_origin": "TOPLEFT"
},
"text": "The transformer encoder receives an encoded",
"orig": "The transformer encoder receives an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.77,
"r_y0": 426.02,
"r_x1": 545.11,
"r_y1": 426.02,
"r_x2": 545.11,
"r_y2": 417.11,
"r_x3": 520.77,
"r_y3": 417.11,
"coord_origin": "TOPLEFT"
},
"text": "image",
"orig": "image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 437.98,
"r_x1": 343.72,
"r_y1": 437.98,
"r_x2": 343.72,
"r_y2": 429.07,
"r_x3": 308.86,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": "from the",
"orig": "from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.04,
"r_y0": 437.75,
"r_x1": 446.45,
"r_y1": 437.75,
"r_x2": 446.45,
"r_y2": 429.16,
"r_x3": 347.04,
"r_y3": 429.16,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.94,
"r_y0": 437.98,
"r_x1": 503.06,
"r_y1": 437.98,
"r_x2": 503.06,
"r_y2": 429.07,
"r_x3": 449.94,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": "and refines it",
"orig": "and refines it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 506.38,
"r_y0": 437.98,
"r_x1": 537.37,
"r_y1": 437.98,
"r_x2": 537.37,
"r_y2": 429.07,
"r_x3": 506.38,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": "through",
"orig": "through",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 540.69,
"r_y0": 437.98,
"r_x1": 545.11,
"r_y1": 437.98,
"r_x2": 545.11,
"r_y2": 429.07,
"r_x3": 540.69,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": "a",
"orig": "a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 449.93,
"r_x1": 522.79,
"r_y1": 449.93,
"r_x2": 522.79,
"r_y2": 441.02,
"r_x3": 308.86,
"r_y3": 441.02,
"coord_origin": "TOPLEFT"
},
"text": "multi-head dot-product attention layer, followed by a",
"orig": "multi-head dot-product attention layer, followed by a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 525.75,
"r_y0": 449.93,
"r_x1": 545.12,
"r_y1": 449.93,
"r_x2": 545.12,
"r_y2": 441.02,
"r_x3": 525.75,
"r_y3": 441.02,
"coord_origin": "TOPLEFT"
},
"text": "Feed",
"orig": "Feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 461.89,
"r_x1": 384.15,
"r_y1": 461.89,
"r_x2": 384.15,
"r_y2": 452.98,
"r_x3": 308.86,
"r_y3": 452.98,
"coord_origin": "TOPLEFT"
},
"text": "Forward Network.",
"orig": "Forward Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.37,
"r_y0": 461.89,
"r_x1": 527.85,
"r_y1": 461.89,
"r_x2": 527.85,
"r_y2": 452.98,
"r_x3": 393.37,
"r_y3": 452.98,
"coord_origin": "TOPLEFT"
},
"text": "During training, the transformer",
"orig": "During training, the transformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.39,
"r_y0": 461.89,
"r_x1": 545.12,
"r_y1": 461.89,
"r_x2": 545.12,
"r_y2": 452.98,
"r_x3": 532.39,
"r_y3": 452.98,
"coord_origin": "TOPLEFT"
},
"text": "de-",
"orig": "de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 473.84,
"r_x1": 529.76,
"r_y1": 473.84,
"r_x2": 529.76,
"r_y2": 464.94,
"r_x3": 308.86,
"r_y3": 464.94,
"coord_origin": "TOPLEFT"
},
"text": "coder receives as input the output feature produced by",
"orig": "coder receives as input the output feature produced by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.94,
"r_y0": 473.84,
"r_x1": 545.12,
"r_y1": 473.84,
"r_x2": 545.12,
"r_y2": 464.94,
"r_x3": 532.94,
"r_y3": 464.94,
"coord_origin": "TOPLEFT"
},
"text": "the",
"orig": "the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 485.8,
"r_x1": 514.17,
"r_y1": 485.8,
"r_x2": 514.17,
"r_y2": 476.89,
"r_x3": 308.86,
"r_y3": 476.89,
"coord_origin": "TOPLEFT"
},
"text": "transformer encoder, and the tokenized input of the",
"orig": "transformer encoder, and the tokenized input of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.89,
"r_y0": 485.8,
"r_x1": 545.12,
"r_y1": 485.8,
"r_x2": 545.12,
"r_y2": 476.89,
"r_x3": 516.89,
"r_y3": 476.89,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.75,
"r_x1": 527.63,
"r_y1": 497.75,
"r_x2": 527.63,
"r_y2": 488.85,
"r_x3": 308.86,
"r_y3": 488.85,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth tags. Using a stack of multi-head attention",
"orig": "ground-truth tags. Using a stack of multi-head attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.62,
"r_y0": 497.75,
"r_x1": 545.11,
"r_y1": 497.75,
"r_x2": 545.11,
"r_y2": 488.85,
"r_x3": 529.62,
"r_y3": 488.85,
"coord_origin": "TOPLEFT"
},
"text": "lay-",
"orig": "lay-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 509.71,
"r_x1": 508.36,
"r_y1": 509.71,
"r_x2": 508.36,
"r_y2": 500.8,
"r_x3": 308.86,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "ers, different aspects of the tag sequence could be",
"orig": "ers, different aspects of the tag sequence could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.09,
"r_y0": 509.71,
"r_x1": 545.12,
"r_y1": 509.71,
"r_x2": 545.12,
"r_y2": 500.8,
"r_x3": 511.09,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "inferred.",
"orig": "inferred.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 521.66,
"r_x1": 545.11,
"r_y1": 521.66,
"r_x2": 545.11,
"r_y2": 512.76,
"r_x3": 308.86,
"r_y3": 512.76,
"coord_origin": "TOPLEFT"
},
"text": "This is achieved by each attention head on a layer operating",
"orig": "This is achieved by each attention head on a layer operating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.62,
"r_x1": 545.12,
"r_y1": 533.62,
"r_x2": 545.12,
"r_y2": 524.71,
"r_x3": 308.86,
"r_y3": 524.71,
"coord_origin": "TOPLEFT"
},
"text": "in a different subspace, and then combining altogether their",
"orig": "in a different subspace, and then combining altogether their",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.57,
"r_x1": 369.73,
"r_y1": 545.57,
"r_x2": 369.73,
"r_y2": 536.67,
"r_x3": 308.86,
"r_y3": 536.67,
"coord_origin": "TOPLEFT"
},
"text": "attention score.",
"orig": "attention score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score."
},
{
"label": "text",
"id": 0,
"page_no": 4,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 548.6,
"r": 545.12,
"b": 653.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 557.56,
"r_x1": 404.76,
"r_y1": 557.56,
"r_x2": 404.76,
"r_y2": 548.6,
"r_x3": 320.82,
"r_y3": 548.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder.",
"orig": "Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.34,
"r_y0": 557.63,
"r_x1": 545.12,
"r_y1": 557.63,
"r_x2": 545.12,
"r_y2": 548.72,
"r_x3": 410.34,
"r_y3": 548.72,
"coord_origin": "TOPLEFT"
},
"text": "Our architecture allows to simul-",
"orig": "Our architecture allows to simul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.59,
"r_x1": 545.11,
"r_y1": 569.59,
"r_x2": 545.11,
"r_y2": 560.68,
"r_x3": 308.86,
"r_y3": 560.68,
"coord_origin": "TOPLEFT"
},
"text": "taneously predict HTML tags and bounding boxes for each",
"orig": "taneously predict HTML tags and bounding boxes for each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.54,
"r_x1": 545.12,
"r_y1": 581.54,
"r_x2": 545.12,
"r_y2": 572.64,
"r_x3": 308.86,
"r_y3": 572.64,
"coord_origin": "TOPLEFT"
},
"text": "table cell without the need of a separate object detector end",
"orig": "table cell without the need of a separate object detector end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.5,
"r_x1": 545.11,
"r_y1": 593.5,
"r_x2": 545.11,
"r_y2": 584.59,
"r_x3": 308.86,
"r_y3": 584.59,
"coord_origin": "TOPLEFT"
},
"text": "to end. This approach is inspired by DETR [1] which em-",
"orig": "to end. This approach is inspired by DETR [1] which em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.45,
"r_x1": 545.11,
"r_y1": 605.45,
"r_x2": 545.11,
"r_y2": 596.55,
"r_x3": 308.86,
"r_y3": 596.55,
"coord_origin": "TOPLEFT"
},
"text": "ploys a Transformer Encoder, and Decoder that looks for",
"orig": "ploys a Transformer Encoder, and Decoder that looks for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.41,
"r_x1": 545.12,
"r_y1": 617.41,
"r_x2": 545.12,
"r_y2": 608.5,
"r_x3": 308.86,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "a specific number of object queries (potential object detec-",
"orig": "a specific number of object queries (potential object detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.36,
"r_x1": 545.12,
"r_y1": 629.36,
"r_x2": 545.12,
"r_y2": 620.46,
"r_x3": 308.86,
"r_y3": 620.46,
"coord_origin": "TOPLEFT"
},
"text": "tions). As our model utilizes a transformer architecture, the",
"orig": "tions). As our model utilizes a transformer architecture, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.32,
"r_x1": 381.68,
"r_y1": 641.32,
"r_x2": 381.68,
"r_y2": 632.41,
"r_x3": 308.86,
"r_y3": 632.41,
"coord_origin": "TOPLEFT"
},
"text": "hidden state of the",
"orig": "hidden state of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 641.1,
"r_x1": 391.75,
"r_y1": 641.1,
"r_x2": 391.75,
"r_y2": 632.25,
"r_x3": 384.0,
"r_y3": 632.25,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.75,
"r_y0": 641.32,
"r_x1": 399.5,
"r_y1": 641.32,
"r_x2": 399.5,
"r_y2": 632.41,
"r_x3": 391.75,
"r_y3": 632.41,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 399.5,
"r_y0": 641.1,
"r_x1": 407.25,
"r_y1": 641.1,
"r_x2": 407.25,
"r_y2": 632.25,
"r_x3": 399.5,
"r_y3": 632.25,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 407.25,
"r_y0": 641.32,
"r_x1": 432.91,
"r_y1": 641.32,
"r_x2": 432.91,
"r_y2": 632.41,
"r_x3": 407.25,
"r_y3": 632.41,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 and \u2018",
"orig": "\u2019 and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 432.91,
"r_y0": 641.1,
"r_x1": 440.66,
"r_y1": 641.1,
"r_x2": 440.66,
"r_y2": 632.25,
"r_x3": 432.91,
"r_y3": 632.25,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.66,
"r_y0": 641.32,
"r_x1": 545.11,
"r_y1": 641.32,
"r_x2": 545.11,
"r_y2": 632.41,
"r_x3": 440.66,
"r_y3": 632.41,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 HTML structure tags be-",
"orig": "\u2019 HTML structure tags be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.27,
"r_x1": 398.96,
"r_y1": 653.27,
"r_x2": 398.96,
"r_y2": 644.37,
"r_x3": 308.86,
"r_y3": 644.37,
"coord_origin": "TOPLEFT"
},
"text": "come the object query.",
"orig": "come the object query.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query."
},
{
"label": "text",
"id": 2,
"page_no": 4,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 656.43,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 665.33,
"r_x1": 444.34,
"r_y1": 665.33,
"r_x2": 444.34,
"r_y2": 656.43,
"r_x3": 320.82,
"r_y3": 656.43,
"coord_origin": "TOPLEFT"
},
"text": "The encoding generated by the",
"orig": "The encoding generated by the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 447.01,
"r_y0": 665.1,
"r_x1": 545.11,
"r_y1": 665.1,
"r_x2": 545.11,
"r_y2": 656.51,
"r_x3": 447.01,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.29,
"r_x1": 545.12,
"r_y1": 677.29,
"r_x2": 545.12,
"r_y2": 668.38,
"r_x3": 308.86,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "along with the features acquired for every data cell from the",
"orig": "along with the features acquired for every data cell from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 308.86,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder are then passed to the attention net-",
"orig": "Transformer Decoder are then passed to the attention net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "work. The attention network takes both inputs and learns to",
"orig": "work. The attention network takes both inputs and learns to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "provide an attention weighted encoding. This weighted at-",
"orig": "provide an attention weighted encoding. This weighted at-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-"
}
],
"headers": [
{
"label": "page_footer",
"id": 9,
"page_no": 4,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5"
}
]
}
},
{
"page_no": 5,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 286.37,
"r_y1": 96.07,
"r_x2": 286.37,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 286.37,
"r_y1": 108.02,
"r_x2": 286.37,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 119.98,
"r_x1": 286.37,
"r_y1": 119.98,
"r_x2": 286.37,
"r_y2": 111.07,
"r_x3": 50.11,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.93,
"r_x1": 286.37,
"r_y1": 131.93,
"r_x2": 286.37,
"r_y2": 123.03,
"r_x3": 50.11,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.89,
"r_x1": 286.37,
"r_y1": 143.89,
"r_x2": 286.37,
"r_y2": 134.98,
"r_x3": 50.11,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.85,
"r_x1": 175.16,
"r_y1": 155.85,
"r_x2": 175.16,
"r_y2": 146.94,
"r_x3": 50.11,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 168.53,
"r_x1": 286.36,
"r_y1": 168.53,
"r_x2": 286.36,
"r_y2": 159.62,
"r_x3": 62.07,
"r_y3": 159.62,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.49,
"r_x1": 286.37,
"r_y1": 180.49,
"r_x2": 286.37,
"r_y2": 171.58,
"r_x3": 50.11,
"r_y3": 171.58,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.44,
"r_x1": 286.37,
"r_y1": 192.44,
"r_x2": 286.37,
"r_y2": 183.54,
"r_x3": 50.11,
"r_y3": 183.54,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.4,
"r_x1": 286.37,
"r_y1": 204.4,
"r_x2": 286.37,
"r_y2": 195.49,
"r_x3": 50.11,
"r_y3": 195.49,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.35,
"r_x1": 286.37,
"r_y1": 216.35,
"r_x2": 286.37,
"r_y2": 207.45,
"r_x3": 50.11,
"r_y3": 207.45,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.31,
"r_x1": 286.37,
"r_y1": 228.31,
"r_x2": 286.37,
"r_y2": 219.4,
"r_x3": 50.11,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 240.26,
"r_x1": 181.55,
"r_y1": 240.26,
"r_x2": 181.55,
"r_y2": 231.36,
"r_x3": 50.11,
"r_y3": 231.36,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.88,
"r_x1": 129.21,
"r_y1": 252.88,
"r_x2": 129.21,
"r_y2": 243.92,
"r_x3": 62.07,
"r_y3": 243.92,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.45,
"r_y0": 252.95,
"r_x1": 286.36,
"r_y1": 252.95,
"r_x2": 286.36,
"r_y2": 244.04,
"r_x3": 134.45,
"r_y3": 244.04,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.9,
"r_x1": 286.37,
"r_y1": 264.9,
"r_x2": 286.37,
"r_y2": 256.0,
"r_x3": 50.11,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.64,
"r_x1": 56.85,
"r_y1": 276.64,
"r_x2": 56.85,
"r_y2": 267.79,
"r_x3": 50.11,
"r_y3": 267.79,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.34,
"r_y0": 276.86,
"r_x1": 135.4,
"r_y1": 276.86,
"r_x2": 135.4,
"r_y2": 267.95,
"r_x3": 57.34,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.74,
"r_y0": 276.63,
"r_x1": 211.08,
"r_y1": 276.63,
"r_x2": 211.08,
"r_y2": 268.04,
"r_x3": 137.74,
"r_y3": 268.04,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.64,
"r_y0": 276.86,
"r_x1": 286.36,
"r_y1": 276.86,
"r_x2": 286.36,
"r_y2": 267.95,
"r_x3": 213.64,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.81,
"r_x1": 158.82,
"r_y1": 288.81,
"r_x2": 158.82,
"r_y2": 279.91,
"r_x3": 50.11,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.32,
"r_y0": 288.58,
"r_x1": 238.8,
"r_y1": 288.58,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.32,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.52,
"r_y0": 288.81,
"r_x1": 286.36,
"r_y1": 288.81,
"r_x2": 286.36,
"r_y2": 279.91,
"r_x3": 241.52,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.77,
"r_x1": 211.38,
"r_y1": 300.77,
"r_x2": 211.38,
"r_y2": 291.86,
"r_x3": 50.11,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.27,
"r_y0": 300.55,
"r_x1": 229.2,
"r_y1": 300.55,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.27,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.77,
"r_x1": 232.19,
"r_y1": 300.77,
"r_x2": 232.19,
"r_y2": 291.86,
"r_x3": 229.7,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.49,
"r_y0": 300.55,
"r_x1": 251.42,
"r_y1": 300.55,
"r_x2": 251.42,
"r_y2": 291.7,
"r_x3": 236.49,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.81,
"r_y0": 300.77,
"r_x1": 286.36,
"r_y1": 300.77,
"r_x2": 286.36,
"r_y2": 291.86,
"r_x3": 254.81,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.72,
"r_x1": 137.45,
"r_y1": 312.72,
"r_x2": 137.45,
"r_y2": 303.82,
"r_x3": 50.11,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.24,
"r_y1": 312.5,
"r_x2": 148.24,
"r_y2": 303.66,
"r_x3": 141.3,
"r_y3": 303.66,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.59,
"r_y0": 312.72,
"r_x1": 286.36,
"r_y1": 312.72,
"r_x2": 286.36,
"r_y2": 303.82,
"r_x3": 152.59,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.68,
"r_x1": 89.68,
"r_y1": 324.68,
"r_x2": 89.68,
"r_y2": 315.77,
"r_x3": 50.11,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.69,
"r_y0": 324.46,
"r_x1": 104.12,
"r_y1": 324.46,
"r_x2": 104.12,
"r_y2": 315.61,
"r_x3": 89.69,
"r_y3": 315.61,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.62,
"r_y0": 324.68,
"r_x1": 286.37,
"r_y1": 324.68,
"r_x2": 286.37,
"r_y2": 315.77,
"r_x3": 104.62,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.64,
"r_x1": 286.37,
"r_y1": 336.64,
"r_x2": 286.37,
"r_y2": 327.73,
"r_x3": 50.11,
"r_y3": 327.73,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.59,
"r_x1": 286.37,
"r_y1": 348.59,
"r_x2": 286.37,
"r_y2": 339.68,
"r_x3": 50.11,
"r_y3": 339.68,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.54,
"r_x1": 286.37,
"r_y1": 360.54,
"r_x2": 286.37,
"r_y2": 351.64,
"r_x3": 50.11,
"r_y3": 351.64,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.5,
"r_x1": 286.37,
"r_y1": 372.5,
"r_x2": 286.37,
"r_y2": 363.59,
"r_x3": 50.11,
"r_y3": 363.59,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.45,
"r_x1": 286.37,
"r_y1": 384.45,
"r_x2": 286.37,
"r_y2": 375.55,
"r_x3": 50.11,
"r_y3": 375.55,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.41,
"r_x1": 286.37,
"r_y1": 396.41,
"r_x2": 286.37,
"r_y2": 387.5,
"r_x3": 50.11,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.37,
"r_x1": 88.69,
"r_y1": 408.37,
"r_x2": 88.69,
"r_y2": 399.46,
"r_x3": 50.11,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.65,
"r_y0": 408.14,
"r_x1": 170.05,
"r_y1": 408.14,
"r_x2": 170.05,
"r_y2": 399.55,
"r_x3": 91.65,
"r_y3": 399.55,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.05,
"r_y0": 408.37,
"r_x1": 286.36,
"r_y1": 408.37,
"r_x2": 286.36,
"r_y2": 399.46,
"r_x3": 170.05,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.32,
"r_x1": 181.97,
"r_y1": 420.32,
"r_x2": 181.97,
"r_y2": 411.41,
"r_x3": 50.11,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.09,
"r_y0": 420.32,
"r_x1": 197.75,
"r_y1": 420.32,
"r_x2": 197.75,
"r_y2": 411.41,
"r_x3": 189.09,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.35,
"r_y0": 420.32,
"r_x1": 286.37,
"r_y1": 420.32,
"r_x2": 286.37,
"r_y2": 411.41,
"r_x3": 200.35,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.28,
"r_x1": 286.37,
"r_y1": 432.28,
"r_x2": 286.37,
"r_y2": 423.37,
"r_x3": 50.11,
"r_y3": 423.37,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.23,
"r_x1": 158.3,
"r_y1": 444.23,
"r_x2": 158.3,
"r_y2": 435.32,
"r_x3": 50.11,
"r_y3": 435.32,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 456.92,
"r_x1": 286.36,
"r_y1": 456.92,
"r_x2": 286.36,
"r_y2": 448.01,
"r_x3": 62.07,
"r_y3": 448.01,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 468.87,
"r_x1": 91.38,
"r_y1": 468.87,
"r_x2": 91.38,
"r_y2": 459.97,
"r_x3": 50.11,
"r_y3": 459.97,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.72,
"r_y0": 502.13,
"r_x1": 140.64,
"r_y1": 502.13,
"r_x2": 140.64,
"r_y2": 493.28,
"r_x3": 125.72,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.91,
"r_y0": 502.13,
"r_x1": 151.66,
"r_y1": 502.13,
"r_x2": 151.66,
"r_y2": 493.28,
"r_x3": 143.91,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.42,
"r_y0": 502.13,
"r_x1": 186.63,
"r_y1": 502.13,
"r_x2": 186.63,
"r_y2": 493.28,
"r_x3": 154.42,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.34,
"r_y0": 502.13,
"r_x1": 197.09,
"r_y1": 502.13,
"r_x2": 197.09,
"r_y2": 493.28,
"r_x3": 189.34,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.13,
"r_x1": 211.65,
"r_y1": 502.13,
"r_x2": 211.65,
"r_y2": 493.28,
"r_x3": 199.3,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.33,
"r_y0": 517.07,
"r_x1": 127.3,
"r_y1": 517.07,
"r_x2": 127.3,
"r_y2": 508.22,
"r_x3": 124.33,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.27,
"r_y0": 517.07,
"r_x1": 138.01,
"r_y1": 517.07,
"r_x2": 138.01,
"r_y2": 508.22,
"r_x3": 130.27,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.78,
"r_y0": 517.07,
"r_x1": 153.33,
"r_y1": 517.07,
"r_x2": 153.33,
"r_y2": 508.22,
"r_x3": 140.78,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.04,
"r_y0": 517.07,
"r_x1": 174.86,
"r_y1": 517.07,
"r_x2": 174.86,
"r_y2": 508.22,
"r_x3": 156.04,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.07,
"r_y0": 517.07,
"r_x1": 184.82,
"r_y1": 517.07,
"r_x2": 184.82,
"r_y2": 507.67,
"r_x3": 177.07,
"r_y3": 507.67,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.03,
"r_y0": 517.07,
"r_x1": 192.84,
"r_y1": 517.07,
"r_x2": 192.84,
"r_y2": 508.22,
"r_x3": 187.03,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.85,
"r_y0": 517.07,
"r_x1": 196.72,
"r_y1": 517.07,
"r_x2": 196.72,
"r_y2": 508.22,
"r_x3": 192.85,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.72,
"r_y0": 517.07,
"r_x1": 211.65,
"r_y1": 517.07,
"r_x2": 211.65,
"r_y2": 508.22,
"r_x3": 196.72,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 509.92,
"r_x1": 286.36,
"r_y1": 509.92,
"r_x2": 286.36,
"r_y2": 501.01,
"r_x3": 274.75,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 540.22,
"r_x1": 74.45,
"r_y1": 540.22,
"r_x2": 74.45,
"r_y2": 531.31,
"r_x3": 50.11,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.94,
"r_y0": 540.0,
"r_x1": 82.75,
"r_y1": 540.0,
"r_x2": 82.75,
"r_y2": 531.15,
"r_x3": 76.94,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.52,
"r_y0": 540.0,
"r_x1": 92.16,
"r_y1": 540.0,
"r_x2": 92.16,
"r_y2": 530.59,
"r_x3": 85.52,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.65,
"r_y0": 540.22,
"r_x1": 135.6,
"r_y1": 540.22,
"r_x2": 135.6,
"r_y2": 531.31,
"r_x3": 94.65,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.09,
"r_y0": 540.0,
"r_x1": 172.63,
"r_y1": 540.0,
"r_x2": 172.63,
"r_y2": 531.15,
"r_x3": 138.09,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.59,
"r_x3": 175.9,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.99,
"r_y0": 540.22,
"r_x1": 281.6,
"r_y1": 540.22,
"r_x2": 281.6,
"r_y2": 531.31,
"r_x3": 194.99,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 566.66,
"r_x1": 57.93,
"r_y1": 566.66,
"r_x2": 57.93,
"r_y2": 555.92,
"r_x3": 50.11,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.35,
"r_y0": 566.66,
"r_x1": 171.98,
"r_y1": 566.66,
"r_x2": 171.98,
"r_y2": 555.92,
"r_x3": 68.35,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.12,
"r_x1": 64.69,
"r_y1": 586.12,
"r_x2": 64.69,
"r_y2": 576.26,
"r_x3": 50.11,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.41,
"r_y0": 586.12,
"r_x1": 179.18,
"r_y1": 586.12,
"r_x2": 179.18,
"r_y2": 576.26,
"r_x3": 74.41,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 604.64,
"r_x1": 202.98,
"r_y1": 604.64,
"r_x2": 202.98,
"r_y2": 595.73,
"r_x3": 62.07,
"r_y3": 595.73,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.38,
"r_y0": 604.41,
"r_x1": 286.36,
"r_y1": 604.41,
"r_x2": 286.36,
"r_y2": 595.82,
"r_x3": 205.38,
"r_y3": 595.82,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 616.37,
"r_x1": 70.04,
"r_y1": 616.37,
"r_x2": 70.04,
"r_y2": 607.78,
"r_x3": 50.11,
"r_y3": 607.78,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 616.6,
"r_x1": 286.36,
"r_y1": 616.6,
"r_x2": 286.36,
"r_y2": 607.69,
"r_x3": 70.04,
"r_y3": 607.69,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 628.55,
"r_x1": 286.37,
"r_y1": 628.55,
"r_x2": 286.37,
"r_y2": 619.64,
"r_x3": 50.11,
"r_y3": 619.64,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 640.51,
"r_x1": 207.03,
"r_y1": 640.51,
"r_x2": 207.03,
"r_y2": 631.6,
"r_x3": 50.11,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.66,
"r_y0": 663.45,
"r_x1": 186.02,
"r_y1": 663.45,
"r_x2": 186.02,
"r_y2": 654.55,
"r_x3": 91.66,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.51,
"r_y0": 663.23,
"r_x1": 196.26,
"r_y1": 663.23,
"r_x2": 196.26,
"r_y2": 653.83,
"r_x3": 188.51,
"r_y3": 653.83,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.75,
"r_y0": 663.45,
"r_x1": 244.81,
"r_y1": 663.45,
"r_x2": 244.81,
"r_y2": 654.55,
"r_x3": 198.75,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.02,
"r_y0": 678.4,
"r_x1": 186.25,
"r_y1": 678.4,
"r_x2": 186.25,
"r_y2": 669.49,
"r_x3": 101.02,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.74,
"r_y0": 678.18,
"r_x1": 196.48,
"r_y1": 678.18,
"r_x2": 196.48,
"r_y2": 668.77,
"r_x3": 188.74,
"r_y3": 668.77,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.98,
"r_y0": 678.4,
"r_x1": 244.81,
"r_y1": 678.4,
"r_x2": 244.81,
"r_y2": 669.49,
"r_x3": 198.98,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 671.02,
"r_x1": 286.36,
"r_y1": 671.02,
"r_x2": 286.36,
"r_y2": 662.12,
"r_x3": 274.75,
"r_y3": 662.12,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 339.99,
"r_y1": 96.07,
"r_x2": 339.99,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.89,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 346.89,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 492.96,
"r_y1": 108.02,
"r_x2": 492.96,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 125.14,
"r_x1": 545.11,
"r_y1": 125.14,
"r_x2": 545.11,
"r_y2": 116.23,
"r_x3": 320.82,
"r_y3": 116.23,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 137.09,
"r_x1": 545.12,
"r_y1": 137.09,
"r_x2": 545.12,
"r_y2": 128.18,
"r_x3": 308.86,
"r_y3": 128.18,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 149.05,
"r_x1": 545.12,
"r_y1": 149.05,
"r_x2": 545.12,
"r_y2": 140.14,
"r_x3": 308.86,
"r_y3": 140.14,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 161.0,
"r_x1": 545.12,
"r_y1": 161.0,
"r_x2": 545.12,
"r_y2": 152.09,
"r_x3": 308.86,
"r_y3": 152.09,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 172.96,
"r_x1": 545.12,
"r_y1": 172.96,
"r_x2": 545.12,
"r_y2": 164.05,
"r_x3": 308.86,
"r_y3": 164.05,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 184.91,
"r_x1": 467.22,
"r_y1": 184.91,
"r_x2": 467.22,
"r_y2": 176.01,
"r_x3": 308.86,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.44,
"r_y0": 184.91,
"r_x1": 545.12,
"r_y1": 184.91,
"r_x2": 545.12,
"r_y2": 176.01,
"r_x3": 475.44,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 196.87,
"r_x1": 545.12,
"r_y1": 196.87,
"r_x2": 545.12,
"r_y2": 187.96,
"r_x3": 308.86,
"r_y3": 187.96,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 208.82,
"r_x1": 545.12,
"r_y1": 208.82,
"r_x2": 545.12,
"r_y2": 199.92,
"r_x3": 308.86,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 220.78,
"r_x1": 545.12,
"r_y1": 220.78,
"r_x2": 545.12,
"r_y2": 211.87,
"r_x3": 308.86,
"r_y3": 211.87,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.73,
"r_x1": 545.12,
"r_y1": 232.73,
"r_x2": 545.12,
"r_y2": 223.83,
"r_x3": 308.86,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 244.69,
"r_x1": 545.12,
"r_y1": 244.69,
"r_x2": 545.12,
"r_y2": 235.78,
"r_x3": 308.86,
"r_y3": 235.78,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.64,
"r_x1": 545.12,
"r_y1": 256.64,
"r_x2": 545.12,
"r_y2": 247.74,
"r_x3": 308.86,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.6,
"r_x1": 342.34,
"r_y1": 268.6,
"r_x2": 342.34,
"r_y2": 259.69,
"r_x3": 308.86,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.95,
"r_y0": 268.6,
"r_x1": 545.12,
"r_y1": 268.6,
"r_x2": 545.12,
"r_y2": 259.69,
"r_x3": 348.95,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.55,
"r_x1": 545.12,
"r_y1": 280.55,
"r_x2": 545.12,
"r_y2": 271.65,
"r_x3": 308.86,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.51,
"r_x1": 545.12,
"r_y1": 292.51,
"r_x2": 545.12,
"r_y2": 283.6,
"r_x3": 308.86,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.46,
"r_x1": 545.12,
"r_y1": 304.46,
"r_x2": 545.12,
"r_y2": 295.56,
"r_x3": 308.86,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.42,
"r_x1": 545.12,
"r_y1": 316.42,
"r_x2": 545.12,
"r_y2": 307.51,
"r_x3": 308.86,
"r_y3": 307.51,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.37,
"r_x1": 532.48,
"r_y1": 328.37,
"r_x2": 532.48,
"r_y2": 319.47,
"r_x3": 308.86,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 345.48,
"r_x1": 545.11,
"r_y1": 345.48,
"r_x2": 545.11,
"r_y2": 336.58,
"r_x3": 320.82,
"r_y3": 336.58,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 357.44,
"r_x1": 403.74,
"r_y1": 357.44,
"r_x2": 403.74,
"r_y2": 348.53,
"r_x3": 308.86,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.08,
"r_y0": 357.21,
"r_x1": 503.54,
"r_y1": 357.21,
"r_x2": 503.54,
"r_y2": 348.62,
"r_x3": 406.08,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.54,
"r_y0": 357.44,
"r_x1": 506.03,
"r_y1": 357.44,
"r_x2": 506.03,
"r_y2": 348.53,
"r_x3": 503.54,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.21,
"r_x1": 545.11,
"r_y1": 357.21,
"r_x2": 545.11,
"r_y2": 348.62,
"r_x3": 508.4,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 369.16,
"r_x1": 343.16,
"r_y1": 369.16,
"r_x2": 343.16,
"r_y2": 360.58,
"r_x3": 308.86,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.16,
"r_y0": 369.39,
"r_x1": 362.2,
"r_y1": 369.39,
"r_x2": 362.2,
"r_y2": 360.49,
"r_x3": 343.16,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.29,
"r_y0": 369.16,
"r_x1": 440.94,
"r_y1": 369.16,
"r_x2": 440.94,
"r_y2": 360.58,
"r_x3": 364.29,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.94,
"r_y0": 369.39,
"r_x1": 545.11,
"r_y1": 369.39,
"r_x2": 545.11,
"r_y2": 360.49,
"r_x3": 440.94,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 381.35,
"r_x1": 545.12,
"r_y1": 381.35,
"r_x2": 545.12,
"r_y2": 372.44,
"r_x3": 308.86,
"r_y3": 372.44,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 393.31,
"r_x1": 545.12,
"r_y1": 393.31,
"r_x2": 545.12,
"r_y2": 384.4,
"r_x3": 308.86,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 405.04,
"r_x1": 314.67,
"r_y1": 405.04,
"r_x2": 314.67,
"r_y2": 396.19,
"r_x3": 308.86,
"r_y3": 396.19,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.66,
"r_y0": 405.26,
"r_x1": 360.39,
"r_y1": 405.26,
"r_x2": 360.39,
"r_y2": 396.35,
"r_x3": 318.66,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.96,
"r_y0": 405.26,
"r_x1": 545.11,
"r_y1": 405.26,
"r_x2": 545.11,
"r_y2": 396.35,
"r_x3": 367.96,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 417.21,
"r_x1": 545.12,
"r_y1": 417.21,
"r_x2": 545.12,
"r_y2": 408.31,
"r_x3": 308.86,
"r_y3": 408.31,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 429.17,
"r_x1": 360.97,
"r_y1": 429.17,
"r_x2": 360.97,
"r_y2": 420.26,
"r_x3": 308.86,
"r_y3": 420.26,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 446.28,
"r_x1": 545.11,
"r_y1": 446.28,
"r_x2": 545.11,
"r_y2": 437.37,
"r_x3": 320.82,
"r_y3": 437.37,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 458.24,
"r_x1": 384.63,
"r_y1": 458.24,
"r_x2": 384.63,
"r_y2": 449.33,
"r_x3": 308.86,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 458.24,
"r_x1": 545.12,
"r_y1": 458.24,
"r_x2": 545.12,
"r_y2": 449.33,
"r_x3": 391.37,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 470.19,
"r_x1": 494.01,
"r_y1": 470.19,
"r_x2": 494.01,
"r_y2": 461.28,
"r_x3": 308.86,
"r_y3": 461.28,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.08,
"r_y0": 469.96,
"r_x1": 545.11,
"r_y1": 469.96,
"r_x2": 545.11,
"r_y2": 461.37,
"r_x3": 498.08,
"r_y3": 461.37,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 481.92,
"r_x1": 364.44,
"r_y1": 481.92,
"r_x2": 364.44,
"r_y2": 473.33,
"r_x3": 308.86,
"r_y3": 473.33,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.06,
"r_y0": 482.15,
"r_x1": 545.11,
"r_y1": 482.15,
"r_x2": 545.11,
"r_y2": 473.24,
"r_x3": 367.06,
"r_y3": 473.24,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 494.1,
"r_x1": 545.12,
"r_y1": 494.1,
"r_x2": 545.12,
"r_y2": 485.19,
"r_x3": 308.86,
"r_y3": 485.19,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 506.06,
"r_x1": 545.12,
"r_y1": 506.06,
"r_x2": 545.12,
"r_y2": 497.15,
"r_x3": 308.86,
"r_y3": 497.15,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 518.01,
"r_x1": 545.12,
"r_y1": 518.01,
"r_x2": 545.12,
"r_y2": 509.11,
"r_x3": 308.86,
"r_y3": 509.11,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 529.97,
"r_x1": 545.12,
"r_y1": 529.97,
"r_x2": 545.12,
"r_y2": 521.06,
"r_x3": 308.86,
"r_y3": 521.06,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 541.92,
"r_x1": 545.12,
"r_y1": 541.92,
"r_x2": 545.12,
"r_y2": 533.02,
"r_x3": 308.86,
"r_y3": 533.02,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 553.88,
"r_x1": 377.22,
"r_y1": 553.88,
"r_x2": 377.22,
"r_y2": 544.97,
"r_x3": 308.86,
"r_y3": 544.97,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 589.41,
"r_x1": 323.9,
"r_y1": 589.41,
"r_x2": 323.9,
"r_y2": 579.55,
"r_x3": 308.86,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.93,
"r_y0": 589.41,
"r_x1": 397.44,
"r_y1": 589.41,
"r_x2": 397.44,
"r_y2": 579.55,
"r_x3": 333.93,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 612.36,
"r_x1": 545.11,
"r_y1": 612.36,
"r_x2": 545.11,
"r_y2": 603.45,
"r_x3": 320.82,
"r_y3": 603.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 624.31,
"r_x1": 545.12,
"r_y1": 624.31,
"r_x2": 545.12,
"r_y2": 615.4,
"r_x3": 308.86,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 636.27,
"r_x1": 545.12,
"r_y1": 636.27,
"r_x2": 545.12,
"r_y2": 627.36,
"r_x3": 308.86,
"r_y3": 627.36,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 648.22,
"r_x1": 545.12,
"r_y1": 648.22,
"r_x2": 545.12,
"r_y2": 639.31,
"r_x3": 308.86,
"r_y3": 639.31,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 660.18,
"r_x1": 545.12,
"r_y1": 660.18,
"r_x2": 545.12,
"r_y2": 651.27,
"r_x3": 308.86,
"r_y3": 651.27,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 672.13,
"r_x1": 350.7,
"r_y1": 672.13,
"r_x2": 350.7,
"r_y2": 663.23,
"r_x3": 308.86,
"r_y3": 663.23,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 320.82,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 396.21,
"r_y1": 701.2,
"r_x2": 396.21,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.41,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 406.41,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 495.94,
"r_y1": 713.15,
"r_x2": 495.94,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 155.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 286.37,
"r_y1": 96.07,
"r_x2": 286.37,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 286.37,
"r_y1": 108.02,
"r_x2": 286.37,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 119.98,
"r_x1": 286.37,
"r_y1": 119.98,
"r_x2": 286.37,
"r_y2": 111.07,
"r_x3": 50.11,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.93,
"r_x1": 286.37,
"r_y1": 131.93,
"r_x2": 286.37,
"r_y2": 123.03,
"r_x3": 50.11,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.89,
"r_x1": 286.37,
"r_y1": 143.89,
"r_x2": 286.37,
"r_y2": 134.98,
"r_x3": 50.11,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.85,
"r_x1": 175.16,
"r_y1": 155.85,
"r_x2": 175.16,
"r_y2": 146.94,
"r_x3": 50.11,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 159.62,
"r": 286.37,
"b": 240.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 168.53,
"r_x1": 286.36,
"r_y1": 168.53,
"r_x2": 286.36,
"r_y2": 159.62,
"r_x3": 62.07,
"r_y3": 159.62,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.49,
"r_x1": 286.37,
"r_y1": 180.49,
"r_x2": 286.37,
"r_y2": 171.58,
"r_x3": 50.11,
"r_y3": 171.58,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.44,
"r_x1": 286.37,
"r_y1": 192.44,
"r_x2": 286.37,
"r_y2": 183.54,
"r_x3": 50.11,
"r_y3": 183.54,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.4,
"r_x1": 286.37,
"r_y1": 204.4,
"r_x2": 286.37,
"r_y2": 195.49,
"r_x3": 50.11,
"r_y3": 195.49,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.35,
"r_x1": 286.37,
"r_y1": 216.35,
"r_x2": 286.37,
"r_y2": 207.45,
"r_x3": 50.11,
"r_y3": 207.45,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.31,
"r_x1": 286.37,
"r_y1": 228.31,
"r_x2": 286.37,
"r_y2": 219.4,
"r_x3": 50.11,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 240.26,
"r_x1": 181.55,
"r_y1": 240.26,
"r_x2": 181.55,
"r_y2": 231.36,
"r_x3": 50.11,
"r_y3": 231.36,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.92,
"r": 286.37,
"b": 444.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.88,
"r_x1": 129.21,
"r_y1": 252.88,
"r_x2": 129.21,
"r_y2": 243.92,
"r_x3": 62.07,
"r_y3": 243.92,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.45,
"r_y0": 252.95,
"r_x1": 286.36,
"r_y1": 252.95,
"r_x2": 286.36,
"r_y2": 244.04,
"r_x3": 134.45,
"r_y3": 244.04,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.9,
"r_x1": 286.37,
"r_y1": 264.9,
"r_x2": 286.37,
"r_y2": 256.0,
"r_x3": 50.11,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.64,
"r_x1": 56.85,
"r_y1": 276.64,
"r_x2": 56.85,
"r_y2": 267.79,
"r_x3": 50.11,
"r_y3": 267.79,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.34,
"r_y0": 276.86,
"r_x1": 135.4,
"r_y1": 276.86,
"r_x2": 135.4,
"r_y2": 267.95,
"r_x3": 57.34,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.74,
"r_y0": 276.63,
"r_x1": 211.08,
"r_y1": 276.63,
"r_x2": 211.08,
"r_y2": 268.04,
"r_x3": 137.74,
"r_y3": 268.04,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.64,
"r_y0": 276.86,
"r_x1": 286.36,
"r_y1": 276.86,
"r_x2": 286.36,
"r_y2": 267.95,
"r_x3": 213.64,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.81,
"r_x1": 158.82,
"r_y1": 288.81,
"r_x2": 158.82,
"r_y2": 279.91,
"r_x3": 50.11,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.32,
"r_y0": 288.58,
"r_x1": 238.8,
"r_y1": 288.58,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.32,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.52,
"r_y0": 288.81,
"r_x1": 286.36,
"r_y1": 288.81,
"r_x2": 286.36,
"r_y2": 279.91,
"r_x3": 241.52,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.77,
"r_x1": 211.38,
"r_y1": 300.77,
"r_x2": 211.38,
"r_y2": 291.86,
"r_x3": 50.11,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.27,
"r_y0": 300.55,
"r_x1": 229.2,
"r_y1": 300.55,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.27,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.77,
"r_x1": 232.19,
"r_y1": 300.77,
"r_x2": 232.19,
"r_y2": 291.86,
"r_x3": 229.7,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.49,
"r_y0": 300.55,
"r_x1": 251.42,
"r_y1": 300.55,
"r_x2": 251.42,
"r_y2": 291.7,
"r_x3": 236.49,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.81,
"r_y0": 300.77,
"r_x1": 286.36,
"r_y1": 300.77,
"r_x2": 286.36,
"r_y2": 291.86,
"r_x3": 254.81,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.72,
"r_x1": 137.45,
"r_y1": 312.72,
"r_x2": 137.45,
"r_y2": 303.82,
"r_x3": 50.11,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.24,
"r_y1": 312.5,
"r_x2": 148.24,
"r_y2": 303.66,
"r_x3": 141.3,
"r_y3": 303.66,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.59,
"r_y0": 312.72,
"r_x1": 286.36,
"r_y1": 312.72,
"r_x2": 286.36,
"r_y2": 303.82,
"r_x3": 152.59,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.68,
"r_x1": 89.68,
"r_y1": 324.68,
"r_x2": 89.68,
"r_y2": 315.77,
"r_x3": 50.11,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.69,
"r_y0": 324.46,
"r_x1": 104.12,
"r_y1": 324.46,
"r_x2": 104.12,
"r_y2": 315.61,
"r_x3": 89.69,
"r_y3": 315.61,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.62,
"r_y0": 324.68,
"r_x1": 286.37,
"r_y1": 324.68,
"r_x2": 286.37,
"r_y2": 315.77,
"r_x3": 104.62,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.64,
"r_x1": 286.37,
"r_y1": 336.64,
"r_x2": 286.37,
"r_y2": 327.73,
"r_x3": 50.11,
"r_y3": 327.73,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.59,
"r_x1": 286.37,
"r_y1": 348.59,
"r_x2": 286.37,
"r_y2": 339.68,
"r_x3": 50.11,
"r_y3": 339.68,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.54,
"r_x1": 286.37,
"r_y1": 360.54,
"r_x2": 286.37,
"r_y2": 351.64,
"r_x3": 50.11,
"r_y3": 351.64,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.5,
"r_x1": 286.37,
"r_y1": 372.5,
"r_x2": 286.37,
"r_y2": 363.59,
"r_x3": 50.11,
"r_y3": 363.59,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.45,
"r_x1": 286.37,
"r_y1": 384.45,
"r_x2": 286.37,
"r_y2": 375.55,
"r_x3": 50.11,
"r_y3": 375.55,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.41,
"r_x1": 286.37,
"r_y1": 396.41,
"r_x2": 286.37,
"r_y2": 387.5,
"r_x3": 50.11,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.37,
"r_x1": 88.69,
"r_y1": 408.37,
"r_x2": 88.69,
"r_y2": 399.46,
"r_x3": 50.11,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.65,
"r_y0": 408.14,
"r_x1": 170.05,
"r_y1": 408.14,
"r_x2": 170.05,
"r_y2": 399.55,
"r_x3": 91.65,
"r_y3": 399.55,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.05,
"r_y0": 408.37,
"r_x1": 286.36,
"r_y1": 408.37,
"r_x2": 286.36,
"r_y2": 399.46,
"r_x3": 170.05,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.32,
"r_x1": 181.97,
"r_y1": 420.32,
"r_x2": 181.97,
"r_y2": 411.41,
"r_x3": 50.11,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.09,
"r_y0": 420.32,
"r_x1": 197.75,
"r_y1": 420.32,
"r_x2": 197.75,
"r_y2": 411.41,
"r_x3": 189.09,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.35,
"r_y0": 420.32,
"r_x1": 286.37,
"r_y1": 420.32,
"r_x2": 286.37,
"r_y2": 411.41,
"r_x3": 200.35,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.28,
"r_x1": 286.37,
"r_y1": 432.28,
"r_x2": 286.37,
"r_y2": 423.37,
"r_x3": 50.11,
"r_y3": 423.37,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.23,
"r_x1": 158.3,
"r_y1": 444.23,
"r_x2": 158.3,
"r_y2": 435.32,
"r_x3": 50.11,
"r_y3": 435.32,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 448.01,
"r": 286.36,
"b": 468.87,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 456.92,
"r_x1": 286.36,
"r_y1": 456.92,
"r_x2": 286.36,
"r_y2": 448.01,
"r_x3": 62.07,
"r_y3": 448.01,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 468.87,
"r_x1": 91.38,
"r_y1": 468.87,
"r_x2": 91.38,
"r_y2": 459.97,
"r_x3": 50.11,
"r_y3": 459.97,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "formula",
"bbox": {
"l": 124.33,
"t": 493.28,
"r": 286.36,
"b": 517.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.72,
"r_y0": 502.13,
"r_x1": 140.64,
"r_y1": 502.13,
"r_x2": 140.64,
"r_y2": 493.28,
"r_x3": 125.72,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.91,
"r_y0": 502.13,
"r_x1": 151.66,
"r_y1": 502.13,
"r_x2": 151.66,
"r_y2": 493.28,
"r_x3": 143.91,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.42,
"r_y0": 502.13,
"r_x1": 186.63,
"r_y1": 502.13,
"r_x2": 186.63,
"r_y2": 493.28,
"r_x3": 154.42,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.34,
"r_y0": 502.13,
"r_x1": 197.09,
"r_y1": 502.13,
"r_x2": 197.09,
"r_y2": 493.28,
"r_x3": 189.34,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.13,
"r_x1": 211.65,
"r_y1": 502.13,
"r_x2": 211.65,
"r_y2": 493.28,
"r_x3": 199.3,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.33,
"r_y0": 517.07,
"r_x1": 127.3,
"r_y1": 517.07,
"r_x2": 127.3,
"r_y2": 508.22,
"r_x3": 124.33,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.27,
"r_y0": 517.07,
"r_x1": 138.01,
"r_y1": 517.07,
"r_x2": 138.01,
"r_y2": 508.22,
"r_x3": 130.27,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.78,
"r_y0": 517.07,
"r_x1": 153.33,
"r_y1": 517.07,
"r_x2": 153.33,
"r_y2": 508.22,
"r_x3": 140.78,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.04,
"r_y0": 517.07,
"r_x1": 174.86,
"r_y1": 517.07,
"r_x2": 174.86,
"r_y2": 508.22,
"r_x3": 156.04,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.07,
"r_y0": 517.07,
"r_x1": 184.82,
"r_y1": 517.07,
"r_x2": 184.82,
"r_y2": 507.67,
"r_x3": 177.07,
"r_y3": 507.67,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.03,
"r_y0": 517.07,
"r_x1": 192.84,
"r_y1": 517.07,
"r_x2": 192.84,
"r_y2": 508.22,
"r_x3": 187.03,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.85,
"r_y0": 517.07,
"r_x1": 196.72,
"r_y1": 517.07,
"r_x2": 196.72,
"r_y2": 508.22,
"r_x3": 192.85,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.72,
"r_y0": 517.07,
"r_x1": 211.65,
"r_y1": 517.07,
"r_x2": 211.65,
"r_y2": 508.22,
"r_x3": 196.72,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 509.92,
"r_x1": 286.36,
"r_y1": 509.92,
"r_x2": 286.36,
"r_y2": 501.01,
"r_x3": 274.75,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 530.59,
"r": 281.6,
"b": 540.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.936,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 540.22,
"r_x1": 74.45,
"r_y1": 540.22,
"r_x2": 74.45,
"r_y2": 531.31,
"r_x3": 50.11,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.94,
"r_y0": 540.0,
"r_x1": 82.75,
"r_y1": 540.0,
"r_x2": 82.75,
"r_y2": 531.15,
"r_x3": 76.94,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.52,
"r_y0": 540.0,
"r_x1": 92.16,
"r_y1": 540.0,
"r_x2": 92.16,
"r_y2": 530.59,
"r_x3": 85.52,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.65,
"r_y0": 540.22,
"r_x1": 135.6,
"r_y1": 540.22,
"r_x2": 135.6,
"r_y2": 531.31,
"r_x3": 94.65,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.09,
"r_y0": 540.0,
"r_x1": 172.63,
"r_y1": 540.0,
"r_x2": 172.63,
"r_y2": 531.15,
"r_x3": 138.09,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.59,
"r_x3": 175.9,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.99,
"r_y0": 540.22,
"r_x1": 281.6,
"r_y1": 540.22,
"r_x2": 281.6,
"r_y2": 531.31,
"r_x3": 194.99,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 555.92,
"r": 171.98,
"b": 566.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 566.66,
"r_x1": 57.93,
"r_y1": 566.66,
"r_x2": 57.93,
"r_y2": 555.92,
"r_x3": 50.11,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.35,
"r_y0": 566.66,
"r_x1": 171.98,
"r_y1": 566.66,
"r_x2": 171.98,
"r_y2": 555.92,
"r_x3": 68.35,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 576.26,
"r": 179.18,
"b": 586.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.12,
"r_x1": 64.69,
"r_y1": 586.12,
"r_x2": 64.69,
"r_y2": 576.26,
"r_x3": 50.11,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.41,
"r_y0": 586.12,
"r_x1": 179.18,
"r_y1": 586.12,
"r_x2": 179.18,
"r_y2": 576.26,
"r_x3": 74.41,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 595.73,
"r": 286.37,
"b": 640.51,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 604.64,
"r_x1": 202.98,
"r_y1": 604.64,
"r_x2": 202.98,
"r_y2": 595.73,
"r_x3": 62.07,
"r_y3": 595.73,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.38,
"r_y0": 604.41,
"r_x1": 286.36,
"r_y1": 604.41,
"r_x2": 286.36,
"r_y2": 595.82,
"r_x3": 205.38,
"r_y3": 595.82,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 616.37,
"r_x1": 70.04,
"r_y1": 616.37,
"r_x2": 70.04,
"r_y2": 607.78,
"r_x3": 50.11,
"r_y3": 607.78,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 616.6,
"r_x1": 286.36,
"r_y1": 616.6,
"r_x2": 286.36,
"r_y2": 607.69,
"r_x3": 70.04,
"r_y3": 607.69,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 628.55,
"r_x1": 286.37,
"r_y1": 628.55,
"r_x2": 286.37,
"r_y2": 619.64,
"r_x3": 50.11,
"r_y3": 619.64,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 640.51,
"r_x1": 207.03,
"r_y1": 640.51,
"r_x2": 207.03,
"r_y2": 631.6,
"r_x3": 50.11,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "formula",
"bbox": {
"l": 91.66,
"t": 653.83,
"r": 286.36,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.844,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.66,
"r_y0": 663.45,
"r_x1": 186.02,
"r_y1": 663.45,
"r_x2": 186.02,
"r_y2": 654.55,
"r_x3": 91.66,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.51,
"r_y0": 663.23,
"r_x1": 196.26,
"r_y1": 663.23,
"r_x2": 196.26,
"r_y2": 653.83,
"r_x3": 188.51,
"r_y3": 653.83,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.75,
"r_y0": 663.45,
"r_x1": 244.81,
"r_y1": 663.45,
"r_x2": 244.81,
"r_y2": 654.55,
"r_x3": 198.75,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.02,
"r_y0": 678.4,
"r_x1": 186.25,
"r_y1": 678.4,
"r_x2": 186.25,
"r_y2": 669.49,
"r_x3": 101.02,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.74,
"r_y0": 678.18,
"r_x1": 196.48,
"r_y1": 678.18,
"r_x2": 196.48,
"r_y2": 668.77,
"r_x3": 188.74,
"r_y3": 668.77,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.98,
"r_y0": 678.4,
"r_x1": 244.81,
"r_y1": 678.4,
"r_x2": 244.81,
"r_y2": 669.49,
"r_x3": 198.98,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 671.02,
"r_x1": 286.36,
"r_y1": 671.02,
"r_x2": 286.36,
"r_y2": 662.12,
"r_x3": 274.75,
"r_y3": 662.12,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 339.99,
"r_y1": 96.07,
"r_x2": 339.99,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.89,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 346.89,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 492.96,
"r_y1": 108.02,
"r_x2": 492.96,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 116.23,
"r": 545.12,
"b": 328.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 125.14,
"r_x1": 545.11,
"r_y1": 125.14,
"r_x2": 545.11,
"r_y2": 116.23,
"r_x3": 320.82,
"r_y3": 116.23,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 137.09,
"r_x1": 545.12,
"r_y1": 137.09,
"r_x2": 545.12,
"r_y2": 128.18,
"r_x3": 308.86,
"r_y3": 128.18,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 149.05,
"r_x1": 545.12,
"r_y1": 149.05,
"r_x2": 545.12,
"r_y2": 140.14,
"r_x3": 308.86,
"r_y3": 140.14,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 161.0,
"r_x1": 545.12,
"r_y1": 161.0,
"r_x2": 545.12,
"r_y2": 152.09,
"r_x3": 308.86,
"r_y3": 152.09,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 172.96,
"r_x1": 545.12,
"r_y1": 172.96,
"r_x2": 545.12,
"r_y2": 164.05,
"r_x3": 308.86,
"r_y3": 164.05,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 184.91,
"r_x1": 467.22,
"r_y1": 184.91,
"r_x2": 467.22,
"r_y2": 176.01,
"r_x3": 308.86,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.44,
"r_y0": 184.91,
"r_x1": 545.12,
"r_y1": 184.91,
"r_x2": 545.12,
"r_y2": 176.01,
"r_x3": 475.44,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 196.87,
"r_x1": 545.12,
"r_y1": 196.87,
"r_x2": 545.12,
"r_y2": 187.96,
"r_x3": 308.86,
"r_y3": 187.96,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 208.82,
"r_x1": 545.12,
"r_y1": 208.82,
"r_x2": 545.12,
"r_y2": 199.92,
"r_x3": 308.86,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 220.78,
"r_x1": 545.12,
"r_y1": 220.78,
"r_x2": 545.12,
"r_y2": 211.87,
"r_x3": 308.86,
"r_y3": 211.87,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.73,
"r_x1": 545.12,
"r_y1": 232.73,
"r_x2": 545.12,
"r_y2": 223.83,
"r_x3": 308.86,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 244.69,
"r_x1": 545.12,
"r_y1": 244.69,
"r_x2": 545.12,
"r_y2": 235.78,
"r_x3": 308.86,
"r_y3": 235.78,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.64,
"r_x1": 545.12,
"r_y1": 256.64,
"r_x2": 545.12,
"r_y2": 247.74,
"r_x3": 308.86,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.6,
"r_x1": 342.34,
"r_y1": 268.6,
"r_x2": 342.34,
"r_y2": 259.69,
"r_x3": 308.86,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.95,
"r_y0": 268.6,
"r_x1": 545.12,
"r_y1": 268.6,
"r_x2": 545.12,
"r_y2": 259.69,
"r_x3": 348.95,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.55,
"r_x1": 545.12,
"r_y1": 280.55,
"r_x2": 545.12,
"r_y2": 271.65,
"r_x3": 308.86,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.51,
"r_x1": 545.12,
"r_y1": 292.51,
"r_x2": 545.12,
"r_y2": 283.6,
"r_x3": 308.86,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.46,
"r_x1": 545.12,
"r_y1": 304.46,
"r_x2": 545.12,
"r_y2": 295.56,
"r_x3": 308.86,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.42,
"r_x1": 545.12,
"r_y1": 316.42,
"r_x2": 545.12,
"r_y2": 307.51,
"r_x3": 308.86,
"r_y3": 307.51,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.37,
"r_x1": 532.48,
"r_y1": 328.37,
"r_x2": 532.48,
"r_y2": 319.47,
"r_x3": 308.86,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 336.58,
"r": 545.12,
"b": 429.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 345.48,
"r_x1": 545.11,
"r_y1": 345.48,
"r_x2": 545.11,
"r_y2": 336.58,
"r_x3": 320.82,
"r_y3": 336.58,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 357.44,
"r_x1": 403.74,
"r_y1": 357.44,
"r_x2": 403.74,
"r_y2": 348.53,
"r_x3": 308.86,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.08,
"r_y0": 357.21,
"r_x1": 503.54,
"r_y1": 357.21,
"r_x2": 503.54,
"r_y2": 348.62,
"r_x3": 406.08,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.54,
"r_y0": 357.44,
"r_x1": 506.03,
"r_y1": 357.44,
"r_x2": 506.03,
"r_y2": 348.53,
"r_x3": 503.54,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.21,
"r_x1": 545.11,
"r_y1": 357.21,
"r_x2": 545.11,
"r_y2": 348.62,
"r_x3": 508.4,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 369.16,
"r_x1": 343.16,
"r_y1": 369.16,
"r_x2": 343.16,
"r_y2": 360.58,
"r_x3": 308.86,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.16,
"r_y0": 369.39,
"r_x1": 362.2,
"r_y1": 369.39,
"r_x2": 362.2,
"r_y2": 360.49,
"r_x3": 343.16,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.29,
"r_y0": 369.16,
"r_x1": 440.94,
"r_y1": 369.16,
"r_x2": 440.94,
"r_y2": 360.58,
"r_x3": 364.29,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.94,
"r_y0": 369.39,
"r_x1": 545.11,
"r_y1": 369.39,
"r_x2": 545.11,
"r_y2": 360.49,
"r_x3": 440.94,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 381.35,
"r_x1": 545.12,
"r_y1": 381.35,
"r_x2": 545.12,
"r_y2": 372.44,
"r_x3": 308.86,
"r_y3": 372.44,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 393.31,
"r_x1": 545.12,
"r_y1": 393.31,
"r_x2": 545.12,
"r_y2": 384.4,
"r_x3": 308.86,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 405.04,
"r_x1": 314.67,
"r_y1": 405.04,
"r_x2": 314.67,
"r_y2": 396.19,
"r_x3": 308.86,
"r_y3": 396.19,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.66,
"r_y0": 405.26,
"r_x1": 360.39,
"r_y1": 405.26,
"r_x2": 360.39,
"r_y2": 396.35,
"r_x3": 318.66,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.96,
"r_y0": 405.26,
"r_x1": 545.11,
"r_y1": 405.26,
"r_x2": 545.11,
"r_y2": 396.35,
"r_x3": 367.96,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 417.21,
"r_x1": 545.12,
"r_y1": 417.21,
"r_x2": 545.12,
"r_y2": 408.31,
"r_x3": 308.86,
"r_y3": 408.31,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 429.17,
"r_x1": 360.97,
"r_y1": 429.17,
"r_x2": 360.97,
"r_y2": 420.26,
"r_x3": 308.86,
"r_y3": 420.26,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 437.37,
"r": 545.12,
"b": 553.88,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 446.28,
"r_x1": 545.11,
"r_y1": 446.28,
"r_x2": 545.11,
"r_y2": 437.37,
"r_x3": 320.82,
"r_y3": 437.37,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 458.24,
"r_x1": 384.63,
"r_y1": 458.24,
"r_x2": 384.63,
"r_y2": 449.33,
"r_x3": 308.86,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 458.24,
"r_x1": 545.12,
"r_y1": 458.24,
"r_x2": 545.12,
"r_y2": 449.33,
"r_x3": 391.37,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 470.19,
"r_x1": 494.01,
"r_y1": 470.19,
"r_x2": 494.01,
"r_y2": 461.28,
"r_x3": 308.86,
"r_y3": 461.28,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.08,
"r_y0": 469.96,
"r_x1": 545.11,
"r_y1": 469.96,
"r_x2": 545.11,
"r_y2": 461.37,
"r_x3": 498.08,
"r_y3": 461.37,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 481.92,
"r_x1": 364.44,
"r_y1": 481.92,
"r_x2": 364.44,
"r_y2": 473.33,
"r_x3": 308.86,
"r_y3": 473.33,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.06,
"r_y0": 482.15,
"r_x1": 545.11,
"r_y1": 482.15,
"r_x2": 545.11,
"r_y2": 473.24,
"r_x3": 367.06,
"r_y3": 473.24,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 494.1,
"r_x1": 545.12,
"r_y1": 494.1,
"r_x2": 545.12,
"r_y2": 485.19,
"r_x3": 308.86,
"r_y3": 485.19,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 506.06,
"r_x1": 545.12,
"r_y1": 506.06,
"r_x2": 545.12,
"r_y2": 497.15,
"r_x3": 308.86,
"r_y3": 497.15,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 518.01,
"r_x1": 545.12,
"r_y1": 518.01,
"r_x2": 545.12,
"r_y2": 509.11,
"r_x3": 308.86,
"r_y3": 509.11,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 529.97,
"r_x1": 545.12,
"r_y1": 529.97,
"r_x2": 545.12,
"r_y2": 521.06,
"r_x3": 308.86,
"r_y3": 521.06,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 541.92,
"r_x1": 545.12,
"r_y1": 541.92,
"r_x2": 545.12,
"r_y2": 533.02,
"r_x3": 308.86,
"r_y3": 533.02,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 553.88,
"r_x1": 377.22,
"r_y1": 553.88,
"r_x2": 377.22,
"r_y2": 544.97,
"r_x3": 308.86,
"r_y3": 544.97,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 579.55,
"r": 397.44,
"b": 589.41,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 589.41,
"r_x1": 323.9,
"r_y1": 589.41,
"r_x2": 323.9,
"r_y2": 579.55,
"r_x3": 308.86,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.93,
"r_y0": 589.41,
"r_x1": 397.44,
"r_y1": 589.41,
"r_x2": 397.44,
"r_y2": 579.55,
"r_x3": 333.93,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 603.45,
"r": 545.12,
"b": 672.13,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 612.36,
"r_x1": 545.11,
"r_y1": 612.36,
"r_x2": 545.11,
"r_y2": 603.45,
"r_x3": 320.82,
"r_y3": 603.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 624.31,
"r_x1": 545.12,
"r_y1": 624.31,
"r_x2": 545.12,
"r_y2": 615.4,
"r_x3": 308.86,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 636.27,
"r_x1": 545.12,
"r_y1": 636.27,
"r_x2": 545.12,
"r_y2": 627.36,
"r_x3": 308.86,
"r_y3": 627.36,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 648.22,
"r_x1": 545.12,
"r_y1": 648.22,
"r_x2": 545.12,
"r_y2": 639.31,
"r_x3": 308.86,
"r_y3": 639.31,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 660.18,
"r_x1": 545.12,
"r_y1": 660.18,
"r_x2": 545.12,
"r_y2": 651.27,
"r_x3": 308.86,
"r_y3": 651.27,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 672.13,
"r_x1": 350.7,
"r_y1": 672.13,
"r_x2": 350.7,
"r_y2": 663.23,
"r_x3": 308.86,
"r_y3": 663.23,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 680.34,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 320.82,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 396.21,
"r_y1": 701.2,
"r_x2": 396.21,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.41,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 406.41,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 495.94,
"r_y1": 713.15,
"r_x2": 495.94,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 5,
"page_no": 5,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 155.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 286.37,
"r_y1": 96.07,
"r_x2": 286.37,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 286.37,
"r_y1": 108.02,
"r_x2": 286.37,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 119.98,
"r_x1": 286.37,
"r_y1": 119.98,
"r_x2": 286.37,
"r_y2": 111.07,
"r_x3": 50.11,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.93,
"r_x1": 286.37,
"r_y1": 131.93,
"r_x2": 286.37,
"r_y2": 123.03,
"r_x3": 50.11,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.89,
"r_x1": 286.37,
"r_y1": 143.89,
"r_x2": 286.37,
"r_y2": 134.98,
"r_x3": 50.11,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.85,
"r_x1": 175.16,
"r_y1": 155.85,
"r_x2": 175.16,
"r_y2": 146.94,
"r_x3": 50.11,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."
},
{
"label": "text",
"id": 6,
"page_no": 5,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 159.62,
"r": 286.37,
"b": 240.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 168.53,
"r_x1": 286.36,
"r_y1": 168.53,
"r_x2": 286.36,
"r_y2": 159.62,
"r_x3": 62.07,
"r_y3": 159.62,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.49,
"r_x1": 286.37,
"r_y1": 180.49,
"r_x2": 286.37,
"r_y2": 171.58,
"r_x3": 50.11,
"r_y3": 171.58,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.44,
"r_x1": 286.37,
"r_y1": 192.44,
"r_x2": 286.37,
"r_y2": 183.54,
"r_x3": 50.11,
"r_y3": 183.54,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.4,
"r_x1": 286.37,
"r_y1": 204.4,
"r_x2": 286.37,
"r_y2": 195.49,
"r_x3": 50.11,
"r_y3": 195.49,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.35,
"r_x1": 286.37,
"r_y1": 216.35,
"r_x2": 286.37,
"r_y2": 207.45,
"r_x3": 50.11,
"r_y3": 207.45,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.31,
"r_x1": 286.37,
"r_y1": 228.31,
"r_x2": 286.37,
"r_y2": 219.4,
"r_x3": 50.11,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 240.26,
"r_x1": 181.55,
"r_y1": 240.26,
"r_x2": 181.55,
"r_y2": 231.36,
"r_x3": 50.11,
"r_y3": 231.36,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."
},
{
"label": "text",
"id": 4,
"page_no": 5,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.92,
"r": 286.37,
"b": 444.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.88,
"r_x1": 129.21,
"r_y1": 252.88,
"r_x2": 129.21,
"r_y2": 243.92,
"r_x3": 62.07,
"r_y3": 243.92,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.45,
"r_y0": 252.95,
"r_x1": 286.36,
"r_y1": 252.95,
"r_x2": 286.36,
"r_y2": 244.04,
"r_x3": 134.45,
"r_y3": 244.04,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.9,
"r_x1": 286.37,
"r_y1": 264.9,
"r_x2": 286.37,
"r_y2": 256.0,
"r_x3": 50.11,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.64,
"r_x1": 56.85,
"r_y1": 276.64,
"r_x2": 56.85,
"r_y2": 267.79,
"r_x3": 50.11,
"r_y3": 267.79,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.34,
"r_y0": 276.86,
"r_x1": 135.4,
"r_y1": 276.86,
"r_x2": 135.4,
"r_y2": 267.95,
"r_x3": 57.34,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.74,
"r_y0": 276.63,
"r_x1": 211.08,
"r_y1": 276.63,
"r_x2": 211.08,
"r_y2": 268.04,
"r_x3": 137.74,
"r_y3": 268.04,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.64,
"r_y0": 276.86,
"r_x1": 286.36,
"r_y1": 276.86,
"r_x2": 286.36,
"r_y2": 267.95,
"r_x3": 213.64,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.81,
"r_x1": 158.82,
"r_y1": 288.81,
"r_x2": 158.82,
"r_y2": 279.91,
"r_x3": 50.11,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.32,
"r_y0": 288.58,
"r_x1": 238.8,
"r_y1": 288.58,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.32,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.52,
"r_y0": 288.81,
"r_x1": 286.36,
"r_y1": 288.81,
"r_x2": 286.36,
"r_y2": 279.91,
"r_x3": 241.52,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.77,
"r_x1": 211.38,
"r_y1": 300.77,
"r_x2": 211.38,
"r_y2": 291.86,
"r_x3": 50.11,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.27,
"r_y0": 300.55,
"r_x1": 229.2,
"r_y1": 300.55,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.27,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.77,
"r_x1": 232.19,
"r_y1": 300.77,
"r_x2": 232.19,
"r_y2": 291.86,
"r_x3": 229.7,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.49,
"r_y0": 300.55,
"r_x1": 251.42,
"r_y1": 300.55,
"r_x2": 251.42,
"r_y2": 291.7,
"r_x3": 236.49,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.81,
"r_y0": 300.77,
"r_x1": 286.36,
"r_y1": 300.77,
"r_x2": 286.36,
"r_y2": 291.86,
"r_x3": 254.81,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.72,
"r_x1": 137.45,
"r_y1": 312.72,
"r_x2": 137.45,
"r_y2": 303.82,
"r_x3": 50.11,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.24,
"r_y1": 312.5,
"r_x2": 148.24,
"r_y2": 303.66,
"r_x3": 141.3,
"r_y3": 303.66,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.59,
"r_y0": 312.72,
"r_x1": 286.36,
"r_y1": 312.72,
"r_x2": 286.36,
"r_y2": 303.82,
"r_x3": 152.59,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.68,
"r_x1": 89.68,
"r_y1": 324.68,
"r_x2": 89.68,
"r_y2": 315.77,
"r_x3": 50.11,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.69,
"r_y0": 324.46,
"r_x1": 104.12,
"r_y1": 324.46,
"r_x2": 104.12,
"r_y2": 315.61,
"r_x3": 89.69,
"r_y3": 315.61,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.62,
"r_y0": 324.68,
"r_x1": 286.37,
"r_y1": 324.68,
"r_x2": 286.37,
"r_y2": 315.77,
"r_x3": 104.62,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.64,
"r_x1": 286.37,
"r_y1": 336.64,
"r_x2": 286.37,
"r_y2": 327.73,
"r_x3": 50.11,
"r_y3": 327.73,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.59,
"r_x1": 286.37,
"r_y1": 348.59,
"r_x2": 286.37,
"r_y2": 339.68,
"r_x3": 50.11,
"r_y3": 339.68,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.54,
"r_x1": 286.37,
"r_y1": 360.54,
"r_x2": 286.37,
"r_y2": 351.64,
"r_x3": 50.11,
"r_y3": 351.64,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.5,
"r_x1": 286.37,
"r_y1": 372.5,
"r_x2": 286.37,
"r_y2": 363.59,
"r_x3": 50.11,
"r_y3": 363.59,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.45,
"r_x1": 286.37,
"r_y1": 384.45,
"r_x2": 286.37,
"r_y2": 375.55,
"r_x3": 50.11,
"r_y3": 375.55,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.41,
"r_x1": 286.37,
"r_y1": 396.41,
"r_x2": 286.37,
"r_y2": 387.5,
"r_x3": 50.11,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.37,
"r_x1": 88.69,
"r_y1": 408.37,
"r_x2": 88.69,
"r_y2": 399.46,
"r_x3": 50.11,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.65,
"r_y0": 408.14,
"r_x1": 170.05,
"r_y1": 408.14,
"r_x2": 170.05,
"r_y2": 399.55,
"r_x3": 91.65,
"r_y3": 399.55,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.05,
"r_y0": 408.37,
"r_x1": 286.36,
"r_y1": 408.37,
"r_x2": 286.36,
"r_y2": 399.46,
"r_x3": 170.05,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.32,
"r_x1": 181.97,
"r_y1": 420.32,
"r_x2": 181.97,
"r_y2": 411.41,
"r_x3": 50.11,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.09,
"r_y0": 420.32,
"r_x1": 197.75,
"r_y1": 420.32,
"r_x2": 197.75,
"r_y2": 411.41,
"r_x3": 189.09,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.35,
"r_y0": 420.32,
"r_x1": 286.37,
"r_y1": 420.32,
"r_x2": 286.37,
"r_y2": 411.41,
"r_x3": 200.35,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.28,
"r_x1": 286.37,
"r_y1": 432.28,
"r_x2": 286.37,
"r_y2": 423.37,
"r_x3": 50.11,
"r_y3": 423.37,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.23,
"r_x1": 158.3,
"r_y1": 444.23,
"r_x2": 158.3,
"r_y2": 435.32,
"r_x3": 50.11,
"r_y3": 435.32,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."
},
{
"label": "text",
"id": 11,
"page_no": 5,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 448.01,
"r": 286.36,
"b": 468.87,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 456.92,
"r_x1": 286.36,
"r_y1": 456.92,
"r_x2": 286.36,
"r_y2": 448.01,
"r_x3": 62.07,
"r_y3": 448.01,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 468.87,
"r_x1": 91.38,
"r_y1": 468.87,
"r_x2": 91.38,
"r_y2": 459.97,
"r_x3": 50.11,
"r_y3": 459.97,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The loss used to train the TableFormer can be defined as following:"
},
{
"label": "formula",
"id": 15,
"page_no": 5,
"cluster": {
"id": 15,
"label": "formula",
"bbox": {
"l": 124.33,
"t": 493.28,
"r": 286.36,
"b": 517.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.72,
"r_y0": 502.13,
"r_x1": 140.64,
"r_y1": 502.13,
"r_x2": 140.64,
"r_y2": 493.28,
"r_x3": 125.72,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.91,
"r_y0": 502.13,
"r_x1": 151.66,
"r_y1": 502.13,
"r_x2": 151.66,
"r_y2": 493.28,
"r_x3": 143.91,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.42,
"r_y0": 502.13,
"r_x1": 186.63,
"r_y1": 502.13,
"r_x2": 186.63,
"r_y2": 493.28,
"r_x3": 154.42,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.34,
"r_y0": 502.13,
"r_x1": 197.09,
"r_y1": 502.13,
"r_x2": 197.09,
"r_y2": 493.28,
"r_x3": 189.34,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.13,
"r_x1": 211.65,
"r_y1": 502.13,
"r_x2": 211.65,
"r_y2": 493.28,
"r_x3": 199.3,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.33,
"r_y0": 517.07,
"r_x1": 127.3,
"r_y1": 517.07,
"r_x2": 127.3,
"r_y2": 508.22,
"r_x3": 124.33,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.27,
"r_y0": 517.07,
"r_x1": 138.01,
"r_y1": 517.07,
"r_x2": 138.01,
"r_y2": 508.22,
"r_x3": 130.27,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.78,
"r_y0": 517.07,
"r_x1": 153.33,
"r_y1": 517.07,
"r_x2": 153.33,
"r_y2": 508.22,
"r_x3": 140.78,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.04,
"r_y0": 517.07,
"r_x1": 174.86,
"r_y1": 517.07,
"r_x2": 174.86,
"r_y2": 508.22,
"r_x3": 156.04,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.07,
"r_y0": 517.07,
"r_x1": 184.82,
"r_y1": 517.07,
"r_x2": 184.82,
"r_y2": 507.67,
"r_x3": 177.07,
"r_y3": 507.67,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.03,
"r_y0": 517.07,
"r_x1": 192.84,
"r_y1": 517.07,
"r_x2": 192.84,
"r_y2": 508.22,
"r_x3": 187.03,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.85,
"r_y0": 517.07,
"r_x1": 196.72,
"r_y1": 517.07,
"r_x2": 196.72,
"r_y2": 508.22,
"r_x3": 192.85,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.72,
"r_y0": 517.07,
"r_x1": 211.65,
"r_y1": 517.07,
"r_x2": 211.65,
"r_y2": 508.22,
"r_x3": 196.72,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 509.92,
"r_x1": 286.36,
"r_y1": 509.92,
"r_x2": 286.36,
"r_y2": 501.01,
"r_x3": 274.75,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)"
},
{
"label": "text",
"id": 16,
"page_no": 5,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 530.59,
"r": 281.6,
"b": 540.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.936,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 540.22,
"r_x1": 74.45,
"r_y1": 540.22,
"r_x2": 74.45,
"r_y2": 531.31,
"r_x3": 50.11,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.94,
"r_y0": 540.0,
"r_x1": 82.75,
"r_y1": 540.0,
"r_x2": 82.75,
"r_y2": 531.15,
"r_x3": 76.94,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.52,
"r_y0": 540.0,
"r_x1": 92.16,
"r_y1": 540.0,
"r_x2": 92.16,
"r_y2": 530.59,
"r_x3": 85.52,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.65,
"r_y0": 540.22,
"r_x1": 135.6,
"r_y1": 540.22,
"r_x2": 135.6,
"r_y2": 531.31,
"r_x3": 94.65,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.09,
"r_y0": 540.0,
"r_x1": 172.63,
"r_y1": 540.0,
"r_x2": 172.63,
"r_y2": 531.15,
"r_x3": 138.09,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.59,
"r_x3": 175.9,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.99,
"r_y0": 540.22,
"r_x1": 281.6,
"r_y1": 540.22,
"r_x2": 281.6,
"r_y2": 531.31,
"r_x3": 194.99,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters."
},
{
"label": "section_header",
"id": 12,
"page_no": 5,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 555.92,
"r": 171.98,
"b": 566.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 566.66,
"r_x1": 57.93,
"r_y1": 566.66,
"r_x2": 57.93,
"r_y2": 555.92,
"r_x3": 50.11,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.35,
"r_y0": 566.66,
"r_x1": 171.98,
"r_y1": 566.66,
"r_x2": 171.98,
"r_y2": 555.92,
"r_x3": 68.35,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Experimental Results"
},
{
"label": "section_header",
"id": 13,
"page_no": 5,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 576.26,
"r": 179.18,
"b": 586.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.12,
"r_x1": 64.69,
"r_y1": 586.12,
"r_x2": 64.69,
"r_y2": 576.26,
"r_x3": 50.11,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.41,
"r_y0": 586.12,
"r_x1": 179.18,
"r_y1": 586.12,
"r_x2": 179.18,
"r_y2": 576.26,
"r_x3": 74.41,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.1. Implementation Details"
},
{
"label": "text",
"id": 7,
"page_no": 5,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 595.73,
"r": 286.37,
"b": 640.51,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 604.64,
"r_x1": 202.98,
"r_y1": 604.64,
"r_x2": 202.98,
"r_y2": 595.73,
"r_x3": 62.07,
"r_y3": 595.73,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.38,
"r_y0": 604.41,
"r_x1": 286.36,
"r_y1": 604.41,
"r_x2": 286.36,
"r_y2": 595.82,
"r_x3": 205.38,
"r_y3": 595.82,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 616.37,
"r_x1": 70.04,
"r_y1": 616.37,
"r_x2": 70.04,
"r_y2": 607.78,
"r_x3": 50.11,
"r_y3": 607.78,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 616.6,
"r_x1": 286.36,
"r_y1": 616.6,
"r_x2": 286.36,
"r_y2": 607.69,
"r_x3": 70.04,
"r_y3": 607.69,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 628.55,
"r_x1": 286.37,
"r_y1": 628.55,
"r_x2": 286.37,
"r_y2": 619.64,
"r_x3": 50.11,
"r_y3": 619.64,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 640.51,
"r_x1": 207.03,
"r_y1": 640.51,
"r_x2": 207.03,
"r_y2": 631.6,
"r_x3": 50.11,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"
},
{
"label": "formula",
"id": 18,
"page_no": 5,
"cluster": {
"id": 18,
"label": "formula",
"bbox": {
"l": 91.66,
"t": 653.83,
"r": 286.36,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.844,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.66,
"r_y0": 663.45,
"r_x1": 186.02,
"r_y1": 663.45,
"r_x2": 186.02,
"r_y2": 654.55,
"r_x3": 91.66,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.51,
"r_y0": 663.23,
"r_x1": 196.26,
"r_y1": 663.23,
"r_x2": 196.26,
"r_y2": 653.83,
"r_x3": 188.51,
"r_y3": 653.83,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.75,
"r_y0": 663.45,
"r_x1": 244.81,
"r_y1": 663.45,
"r_x2": 244.81,
"r_y2": 654.55,
"r_x3": 198.75,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.02,
"r_y0": 678.4,
"r_x1": 186.25,
"r_y1": 678.4,
"r_x2": 186.25,
"r_y2": 669.49,
"r_x3": 101.02,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.74,
"r_y0": 678.18,
"r_x1": 196.48,
"r_y1": 678.18,
"r_x2": 196.48,
"r_y2": 668.77,
"r_x3": 188.74,
"r_y3": 668.77,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.98,
"r_y0": 678.4,
"r_x1": 244.81,
"r_y1": 678.4,
"r_x2": 244.81,
"r_y2": 669.49,
"r_x3": 198.98,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 671.02,
"r_x1": 286.36,
"r_y1": 671.02,
"r_x2": 286.36,
"r_y2": 662.12,
"r_x3": 274.75,
"r_y3": 662.12,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"
},
{
"label": "text",
"id": 10,
"page_no": 5,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"
},
{
"label": "text",
"id": 9,
"page_no": 5,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 339.99,
"r_y1": 96.07,
"r_x2": 339.99,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.89,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 346.89,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 492.96,
"r_y1": 108.02,
"r_x2": 492.96,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."
},
{
"label": "text",
"id": 1,
"page_no": 5,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 116.23,
"r": 545.12,
"b": 328.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 125.14,
"r_x1": 545.11,
"r_y1": 125.14,
"r_x2": 545.11,
"r_y2": 116.23,
"r_x3": 320.82,
"r_y3": 116.23,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 137.09,
"r_x1": 545.12,
"r_y1": 137.09,
"r_x2": 545.12,
"r_y2": 128.18,
"r_x3": 308.86,
"r_y3": 128.18,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 149.05,
"r_x1": 545.12,
"r_y1": 149.05,
"r_x2": 545.12,
"r_y2": 140.14,
"r_x3": 308.86,
"r_y3": 140.14,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 161.0,
"r_x1": 545.12,
"r_y1": 161.0,
"r_x2": 545.12,
"r_y2": 152.09,
"r_x3": 308.86,
"r_y3": 152.09,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 172.96,
"r_x1": 545.12,
"r_y1": 172.96,
"r_x2": 545.12,
"r_y2": 164.05,
"r_x3": 308.86,
"r_y3": 164.05,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 184.91,
"r_x1": 467.22,
"r_y1": 184.91,
"r_x2": 467.22,
"r_y2": 176.01,
"r_x3": 308.86,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.44,
"r_y0": 184.91,
"r_x1": 545.12,
"r_y1": 184.91,
"r_x2": 545.12,
"r_y2": 176.01,
"r_x3": 475.44,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 196.87,
"r_x1": 545.12,
"r_y1": 196.87,
"r_x2": 545.12,
"r_y2": 187.96,
"r_x3": 308.86,
"r_y3": 187.96,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 208.82,
"r_x1": 545.12,
"r_y1": 208.82,
"r_x2": 545.12,
"r_y2": 199.92,
"r_x3": 308.86,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 220.78,
"r_x1": 545.12,
"r_y1": 220.78,
"r_x2": 545.12,
"r_y2": 211.87,
"r_x3": 308.86,
"r_y3": 211.87,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.73,
"r_x1": 545.12,
"r_y1": 232.73,
"r_x2": 545.12,
"r_y2": 223.83,
"r_x3": 308.86,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 244.69,
"r_x1": 545.12,
"r_y1": 244.69,
"r_x2": 545.12,
"r_y2": 235.78,
"r_x3": 308.86,
"r_y3": 235.78,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.64,
"r_x1": 545.12,
"r_y1": 256.64,
"r_x2": 545.12,
"r_y2": 247.74,
"r_x3": 308.86,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.6,
"r_x1": 342.34,
"r_y1": 268.6,
"r_x2": 342.34,
"r_y2": 259.69,
"r_x3": 308.86,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.95,
"r_y0": 268.6,
"r_x1": 545.12,
"r_y1": 268.6,
"r_x2": 545.12,
"r_y2": 259.69,
"r_x3": 348.95,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.55,
"r_x1": 545.12,
"r_y1": 280.55,
"r_x2": 545.12,
"r_y2": 271.65,
"r_x3": 308.86,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.51,
"r_x1": 545.12,
"r_y1": 292.51,
"r_x2": 545.12,
"r_y2": 283.6,
"r_x3": 308.86,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.46,
"r_x1": 545.12,
"r_y1": 304.46,
"r_x2": 545.12,
"r_y2": 295.56,
"r_x3": 308.86,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.42,
"r_x1": 545.12,
"r_y1": 316.42,
"r_x2": 545.12,
"r_y2": 307.51,
"r_x3": 308.86,
"r_y3": 307.51,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.37,
"r_x1": 532.48,
"r_y1": 328.37,
"r_x2": 532.48,
"r_y2": 319.47,
"r_x3": 308.86,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."
},
{
"label": "text",
"id": 3,
"page_no": 5,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 336.58,
"r": 545.12,
"b": 429.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 345.48,
"r_x1": 545.11,
"r_y1": 345.48,
"r_x2": 545.11,
"r_y2": 336.58,
"r_x3": 320.82,
"r_y3": 336.58,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 357.44,
"r_x1": 403.74,
"r_y1": 357.44,
"r_x2": 403.74,
"r_y2": 348.53,
"r_x3": 308.86,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.08,
"r_y0": 357.21,
"r_x1": 503.54,
"r_y1": 357.21,
"r_x2": 503.54,
"r_y2": 348.62,
"r_x3": 406.08,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.54,
"r_y0": 357.44,
"r_x1": 506.03,
"r_y1": 357.44,
"r_x2": 506.03,
"r_y2": 348.53,
"r_x3": 503.54,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.21,
"r_x1": 545.11,
"r_y1": 357.21,
"r_x2": 545.11,
"r_y2": 348.62,
"r_x3": 508.4,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 369.16,
"r_x1": 343.16,
"r_y1": 369.16,
"r_x2": 343.16,
"r_y2": 360.58,
"r_x3": 308.86,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.16,
"r_y0": 369.39,
"r_x1": 362.2,
"r_y1": 369.39,
"r_x2": 362.2,
"r_y2": 360.49,
"r_x3": 343.16,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.29,
"r_y0": 369.16,
"r_x1": 440.94,
"r_y1": 369.16,
"r_x2": 440.94,
"r_y2": 360.58,
"r_x3": 364.29,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.94,
"r_y0": 369.39,
"r_x1": 545.11,
"r_y1": 369.39,
"r_x2": 545.11,
"r_y2": 360.49,
"r_x3": 440.94,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 381.35,
"r_x1": 545.12,
"r_y1": 381.35,
"r_x2": 545.12,
"r_y2": 372.44,
"r_x3": 308.86,
"r_y3": 372.44,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 393.31,
"r_x1": 545.12,
"r_y1": 393.31,
"r_x2": 545.12,
"r_y2": 384.4,
"r_x3": 308.86,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 405.04,
"r_x1": 314.67,
"r_y1": 405.04,
"r_x2": 314.67,
"r_y2": 396.19,
"r_x3": 308.86,
"r_y3": 396.19,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.66,
"r_y0": 405.26,
"r_x1": 360.39,
"r_y1": 405.26,
"r_x2": 360.39,
"r_y2": 396.35,
"r_x3": 318.66,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.96,
"r_y0": 405.26,
"r_x1": 545.11,
"r_y1": 405.26,
"r_x2": 545.11,
"r_y2": 396.35,
"r_x3": 367.96,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 417.21,
"r_x1": 545.12,
"r_y1": 417.21,
"r_x2": 545.12,
"r_y2": 408.31,
"r_x3": 308.86,
"r_y3": 408.31,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 429.17,
"r_x1": 360.97,
"r_y1": 429.17,
"r_x2": 360.97,
"r_y2": 420.26,
"r_x3": 308.86,
"r_y3": 420.26,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."
},
{
"label": "text",
"id": 0,
"page_no": 5,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 437.37,
"r": 545.12,
"b": 553.88,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 446.28,
"r_x1": 545.11,
"r_y1": 446.28,
"r_x2": 545.11,
"r_y2": 437.37,
"r_x3": 320.82,
"r_y3": 437.37,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 458.24,
"r_x1": 384.63,
"r_y1": 458.24,
"r_x2": 384.63,
"r_y2": 449.33,
"r_x3": 308.86,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 458.24,
"r_x1": 545.12,
"r_y1": 458.24,
"r_x2": 545.12,
"r_y2": 449.33,
"r_x3": 391.37,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 470.19,
"r_x1": 494.01,
"r_y1": 470.19,
"r_x2": 494.01,
"r_y2": 461.28,
"r_x3": 308.86,
"r_y3": 461.28,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.08,
"r_y0": 469.96,
"r_x1": 545.11,
"r_y1": 469.96,
"r_x2": 545.11,
"r_y2": 461.37,
"r_x3": 498.08,
"r_y3": 461.37,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 481.92,
"r_x1": 364.44,
"r_y1": 481.92,
"r_x2": 364.44,
"r_y2": 473.33,
"r_x3": 308.86,
"r_y3": 473.33,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.06,
"r_y0": 482.15,
"r_x1": 545.11,
"r_y1": 482.15,
"r_x2": 545.11,
"r_y2": 473.24,
"r_x3": 367.06,
"r_y3": 473.24,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 494.1,
"r_x1": 545.12,
"r_y1": 494.1,
"r_x2": 545.12,
"r_y2": 485.19,
"r_x3": 308.86,
"r_y3": 485.19,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 506.06,
"r_x1": 545.12,
"r_y1": 506.06,
"r_x2": 545.12,
"r_y2": 497.15,
"r_x3": 308.86,
"r_y3": 497.15,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 518.01,
"r_x1": 545.12,
"r_y1": 518.01,
"r_x2": 545.12,
"r_y2": 509.11,
"r_x3": 308.86,
"r_y3": 509.11,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 529.97,
"r_x1": 545.12,
"r_y1": 529.97,
"r_x2": 545.12,
"r_y2": 521.06,
"r_x3": 308.86,
"r_y3": 521.06,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 541.92,
"r_x1": 545.12,
"r_y1": 541.92,
"r_x2": 545.12,
"r_y2": 533.02,
"r_x3": 308.86,
"r_y3": 533.02,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 553.88,
"r_x1": 377.22,
"r_y1": 553.88,
"r_x2": 377.22,
"r_y2": 544.97,
"r_x3": 308.86,
"r_y3": 544.97,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."
},
{
"label": "section_header",
"id": 14,
"page_no": 5,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 579.55,
"r": 397.44,
"b": 589.41,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 589.41,
"r_x1": 323.9,
"r_y1": 589.41,
"r_x2": 323.9,
"r_y2": 579.55,
"r_x3": 308.86,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.93,
"r_y0": 589.41,
"r_x1": 397.44,
"r_y1": 589.41,
"r_x2": 397.44,
"r_y2": 579.55,
"r_x3": 333.93,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.2. Generalization"
},
{
"label": "text",
"id": 2,
"page_no": 5,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 603.45,
"r": 545.12,
"b": 672.13,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 612.36,
"r_x1": 545.11,
"r_y1": 612.36,
"r_x2": 545.11,
"r_y2": 603.45,
"r_x3": 320.82,
"r_y3": 603.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 624.31,
"r_x1": 545.12,
"r_y1": 624.31,
"r_x2": 545.12,
"r_y2": 615.4,
"r_x3": 308.86,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 636.27,
"r_x1": 545.12,
"r_y1": 636.27,
"r_x2": 545.12,
"r_y2": 627.36,
"r_x3": 308.86,
"r_y3": 627.36,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 648.22,
"r_x1": 545.12,
"r_y1": 648.22,
"r_x2": 545.12,
"r_y2": 639.31,
"r_x3": 308.86,
"r_y3": 639.31,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 660.18,
"r_x1": 545.12,
"r_y1": 660.18,
"r_x2": 545.12,
"r_y2": 651.27,
"r_x3": 308.86,
"r_y3": 651.27,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 672.13,
"r_x1": 350.7,
"r_y1": 672.13,
"r_x2": 350.7,
"r_y2": 663.23,
"r_x3": 308.86,
"r_y3": 663.23,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."
},
{
"label": "text",
"id": 8,
"page_no": 5,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 680.34,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 320.82,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 396.21,
"r_y1": 701.2,
"r_x2": 396.21,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.41,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 406.41,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 495.94,
"r_y1": 713.15,
"r_x2": 495.94,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."
},
{
"label": "page_footer",
"id": 17,
"page_no": 5,
"cluster": {
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6"
}
],
"body": [
{
"label": "text",
"id": 5,
"page_no": 5,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 286.37,
"b": 155.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 286.37,
"r_y1": 84.11,
"r_x2": 286.37,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 96.07,
"r_x1": 286.37,
"r_y1": 96.07,
"r_x2": 286.37,
"r_y2": 87.16,
"r_x3": 50.11,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 286.37,
"r_y1": 108.02,
"r_x2": 286.37,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 119.98,
"r_x1": 286.37,
"r_y1": 119.98,
"r_x2": 286.37,
"r_y2": 111.07,
"r_x3": 50.11,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.93,
"r_x1": 286.37,
"r_y1": 131.93,
"r_x2": 286.37,
"r_y2": 123.03,
"r_x3": 50.11,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 143.89,
"r_x1": 286.37,
"r_y1": 143.89,
"r_x2": 286.37,
"r_y2": 134.98,
"r_x3": 50.11,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 155.85,
"r_x1": 175.16,
"r_y1": 155.85,
"r_x2": 175.16,
"r_y2": 146.94,
"r_x3": 50.11,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."
},
{
"label": "text",
"id": 6,
"page_no": 5,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 159.62,
"r": 286.37,
"b": 240.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 168.53,
"r_x1": 286.36,
"r_y1": 168.53,
"r_x2": 286.36,
"r_y2": 159.62,
"r_x3": 62.07,
"r_y3": 159.62,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 180.49,
"r_x1": 286.37,
"r_y1": 180.49,
"r_x2": 286.37,
"r_y2": 171.58,
"r_x3": 50.11,
"r_y3": 171.58,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 192.44,
"r_x1": 286.37,
"r_y1": 192.44,
"r_x2": 286.37,
"r_y2": 183.54,
"r_x3": 50.11,
"r_y3": 183.54,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 204.4,
"r_x1": 286.37,
"r_y1": 204.4,
"r_x2": 286.37,
"r_y2": 195.49,
"r_x3": 50.11,
"r_y3": 195.49,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 216.35,
"r_x1": 286.37,
"r_y1": 216.35,
"r_x2": 286.37,
"r_y2": 207.45,
"r_x3": 50.11,
"r_y3": 207.45,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 228.31,
"r_x1": 286.37,
"r_y1": 228.31,
"r_x2": 286.37,
"r_y2": 219.4,
"r_x3": 50.11,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 240.26,
"r_x1": 181.55,
"r_y1": 240.26,
"r_x2": 181.55,
"r_y2": 231.36,
"r_x3": 50.11,
"r_y3": 231.36,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."
},
{
"label": "text",
"id": 4,
"page_no": 5,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.92,
"r": 286.37,
"b": 444.23,
"coord_origin": "TOPLEFT"
},
"confidence": 0.987,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.88,
"r_x1": 129.21,
"r_y1": 252.88,
"r_x2": 129.21,
"r_y2": 243.92,
"r_x3": 62.07,
"r_y3": 243.92,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.45,
"r_y0": 252.95,
"r_x1": 286.36,
"r_y1": 252.95,
"r_x2": 286.36,
"r_y2": 244.04,
"r_x3": 134.45,
"r_y3": 244.04,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.9,
"r_x1": 286.37,
"r_y1": 264.9,
"r_x2": 286.37,
"r_y2": 256.0,
"r_x3": 50.11,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.64,
"r_x1": 56.85,
"r_y1": 276.64,
"r_x2": 56.85,
"r_y2": 267.79,
"r_x3": 50.11,
"r_y3": 267.79,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.34,
"r_y0": 276.86,
"r_x1": 135.4,
"r_y1": 276.86,
"r_x2": 135.4,
"r_y2": 267.95,
"r_x3": 57.34,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.74,
"r_y0": 276.63,
"r_x1": 211.08,
"r_y1": 276.63,
"r_x2": 211.08,
"r_y2": 268.04,
"r_x3": 137.74,
"r_y3": 268.04,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.64,
"r_y0": 276.86,
"r_x1": 286.36,
"r_y1": 276.86,
"r_x2": 286.36,
"r_y2": 267.95,
"r_x3": 213.64,
"r_y3": 267.95,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.81,
"r_x1": 158.82,
"r_y1": 288.81,
"r_x2": 158.82,
"r_y2": 279.91,
"r_x3": 50.11,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.32,
"r_y0": 288.58,
"r_x1": 238.8,
"r_y1": 288.58,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.32,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.52,
"r_y0": 288.81,
"r_x1": 286.36,
"r_y1": 288.81,
"r_x2": 286.36,
"r_y2": 279.91,
"r_x3": 241.52,
"r_y3": 279.91,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.77,
"r_x1": 211.38,
"r_y1": 300.77,
"r_x2": 211.38,
"r_y2": 291.86,
"r_x3": 50.11,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.27,
"r_y0": 300.55,
"r_x1": 229.2,
"r_y1": 300.55,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.27,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.77,
"r_x1": 232.19,
"r_y1": 300.77,
"r_x2": 232.19,
"r_y2": 291.86,
"r_x3": 229.7,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.49,
"r_y0": 300.55,
"r_x1": 251.42,
"r_y1": 300.55,
"r_x2": 251.42,
"r_y2": 291.7,
"r_x3": 236.49,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.81,
"r_y0": 300.77,
"r_x1": 286.36,
"r_y1": 300.77,
"r_x2": 286.36,
"r_y2": 291.86,
"r_x3": 254.81,
"r_y3": 291.86,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.72,
"r_x1": 137.45,
"r_y1": 312.72,
"r_x2": 137.45,
"r_y2": 303.82,
"r_x3": 50.11,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.24,
"r_y1": 312.5,
"r_x2": 148.24,
"r_y2": 303.66,
"r_x3": 141.3,
"r_y3": 303.66,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.59,
"r_y0": 312.72,
"r_x1": 286.36,
"r_y1": 312.72,
"r_x2": 286.36,
"r_y2": 303.82,
"r_x3": 152.59,
"r_y3": 303.82,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.68,
"r_x1": 89.68,
"r_y1": 324.68,
"r_x2": 89.68,
"r_y2": 315.77,
"r_x3": 50.11,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.69,
"r_y0": 324.46,
"r_x1": 104.12,
"r_y1": 324.46,
"r_x2": 104.12,
"r_y2": 315.61,
"r_x3": 89.69,
"r_y3": 315.61,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.62,
"r_y0": 324.68,
"r_x1": 286.37,
"r_y1": 324.68,
"r_x2": 286.37,
"r_y2": 315.77,
"r_x3": 104.62,
"r_y3": 315.77,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.64,
"r_x1": 286.37,
"r_y1": 336.64,
"r_x2": 286.37,
"r_y2": 327.73,
"r_x3": 50.11,
"r_y3": 327.73,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.59,
"r_x1": 286.37,
"r_y1": 348.59,
"r_x2": 286.37,
"r_y2": 339.68,
"r_x3": 50.11,
"r_y3": 339.68,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.54,
"r_x1": 286.37,
"r_y1": 360.54,
"r_x2": 286.37,
"r_y2": 351.64,
"r_x3": 50.11,
"r_y3": 351.64,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.5,
"r_x1": 286.37,
"r_y1": 372.5,
"r_x2": 286.37,
"r_y2": 363.59,
"r_x3": 50.11,
"r_y3": 363.59,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.45,
"r_x1": 286.37,
"r_y1": 384.45,
"r_x2": 286.37,
"r_y2": 375.55,
"r_x3": 50.11,
"r_y3": 375.55,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.41,
"r_x1": 286.37,
"r_y1": 396.41,
"r_x2": 286.37,
"r_y2": 387.5,
"r_x3": 50.11,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 408.37,
"r_x1": 88.69,
"r_y1": 408.37,
"r_x2": 88.69,
"r_y2": 399.46,
"r_x3": 50.11,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.65,
"r_y0": 408.14,
"r_x1": 170.05,
"r_y1": 408.14,
"r_x2": 170.05,
"r_y2": 399.55,
"r_x3": 91.65,
"r_y3": 399.55,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.05,
"r_y0": 408.37,
"r_x1": 286.36,
"r_y1": 408.37,
"r_x2": 286.36,
"r_y2": 399.46,
"r_x3": 170.05,
"r_y3": 399.46,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 420.32,
"r_x1": 181.97,
"r_y1": 420.32,
"r_x2": 181.97,
"r_y2": 411.41,
"r_x3": 50.11,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.09,
"r_y0": 420.32,
"r_x1": 197.75,
"r_y1": 420.32,
"r_x2": 197.75,
"r_y2": 411.41,
"r_x3": 189.09,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.35,
"r_y0": 420.32,
"r_x1": 286.37,
"r_y1": 420.32,
"r_x2": 286.37,
"r_y2": 411.41,
"r_x3": 200.35,
"r_y3": 411.41,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 432.28,
"r_x1": 286.37,
"r_y1": 432.28,
"r_x2": 286.37,
"r_y2": 423.37,
"r_x3": 50.11,
"r_y3": 423.37,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.23,
"r_x1": 158.3,
"r_y1": 444.23,
"r_x2": 158.3,
"r_y2": 435.32,
"r_x3": 50.11,
"r_y3": 435.32,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."
},
{
"label": "text",
"id": 11,
"page_no": 5,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 448.01,
"r": 286.36,
"b": 468.87,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 456.92,
"r_x1": 286.36,
"r_y1": 456.92,
"r_x2": 286.36,
"r_y2": 448.01,
"r_x3": 62.07,
"r_y3": 448.01,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 468.87,
"r_x1": 91.38,
"r_y1": 468.87,
"r_x2": 91.38,
"r_y2": 459.97,
"r_x3": 50.11,
"r_y3": 459.97,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The loss used to train the TableFormer can be defined as following:"
},
{
"label": "formula",
"id": 15,
"page_no": 5,
"cluster": {
"id": 15,
"label": "formula",
"bbox": {
"l": 124.33,
"t": 493.28,
"r": 286.36,
"b": 517.07,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.72,
"r_y0": 502.13,
"r_x1": 140.64,
"r_y1": 502.13,
"r_x2": 140.64,
"r_y2": 493.28,
"r_x3": 125.72,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.91,
"r_y0": 502.13,
"r_x1": 151.66,
"r_y1": 502.13,
"r_x2": 151.66,
"r_y2": 493.28,
"r_x3": 143.91,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.42,
"r_y0": 502.13,
"r_x1": 186.63,
"r_y1": 502.13,
"r_x2": 186.63,
"r_y2": 493.28,
"r_x3": 154.42,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.34,
"r_y0": 502.13,
"r_x1": 197.09,
"r_y1": 502.13,
"r_x2": 197.09,
"r_y2": 493.28,
"r_x3": 189.34,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.13,
"r_x1": 211.65,
"r_y1": 502.13,
"r_x2": 211.65,
"r_y2": 493.28,
"r_x3": 199.3,
"r_y3": 493.28,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.33,
"r_y0": 517.07,
"r_x1": 127.3,
"r_y1": 517.07,
"r_x2": 127.3,
"r_y2": 508.22,
"r_x3": 124.33,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.27,
"r_y0": 517.07,
"r_x1": 138.01,
"r_y1": 517.07,
"r_x2": 138.01,
"r_y2": 508.22,
"r_x3": 130.27,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.78,
"r_y0": 517.07,
"r_x1": 153.33,
"r_y1": 517.07,
"r_x2": 153.33,
"r_y2": 508.22,
"r_x3": 140.78,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.04,
"r_y0": 517.07,
"r_x1": 174.86,
"r_y1": 517.07,
"r_x2": 174.86,
"r_y2": 508.22,
"r_x3": 156.04,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.07,
"r_y0": 517.07,
"r_x1": 184.82,
"r_y1": 517.07,
"r_x2": 184.82,
"r_y2": 507.67,
"r_x3": 177.07,
"r_y3": 507.67,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.03,
"r_y0": 517.07,
"r_x1": 192.84,
"r_y1": 517.07,
"r_x2": 192.84,
"r_y2": 508.22,
"r_x3": 187.03,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.85,
"r_y0": 517.07,
"r_x1": 196.72,
"r_y1": 517.07,
"r_x2": 196.72,
"r_y2": 508.22,
"r_x3": 192.85,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.72,
"r_y0": 517.07,
"r_x1": 211.65,
"r_y1": 517.07,
"r_x2": 211.65,
"r_y2": 508.22,
"r_x3": 196.72,
"r_y3": 508.22,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 509.92,
"r_x1": 286.36,
"r_y1": 509.92,
"r_x2": 286.36,
"r_y2": 501.01,
"r_x3": 274.75,
"r_y3": 501.01,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)"
},
{
"label": "text",
"id": 16,
"page_no": 5,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 530.59,
"r": 281.6,
"b": 540.22,
"coord_origin": "TOPLEFT"
},
"confidence": 0.936,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 540.22,
"r_x1": 74.45,
"r_y1": 540.22,
"r_x2": 74.45,
"r_y2": 531.31,
"r_x3": 50.11,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.94,
"r_y0": 540.0,
"r_x1": 82.75,
"r_y1": 540.0,
"r_x2": 82.75,
"r_y2": 531.15,
"r_x3": 76.94,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.52,
"r_y0": 540.0,
"r_x1": 92.16,
"r_y1": 540.0,
"r_x2": 92.16,
"r_y2": 530.59,
"r_x3": 85.52,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.65,
"r_y0": 540.22,
"r_x1": 135.6,
"r_y1": 540.22,
"r_x2": 135.6,
"r_y2": 531.31,
"r_x3": 94.65,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.09,
"r_y0": 540.0,
"r_x1": 172.63,
"r_y1": 540.0,
"r_x2": 172.63,
"r_y2": 531.15,
"r_x3": 138.09,
"r_y3": 531.15,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.59,
"r_x3": 175.9,
"r_y3": 530.59,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.99,
"r_y0": 540.22,
"r_x1": 281.6,
"r_y1": 540.22,
"r_x2": 281.6,
"r_y2": 531.31,
"r_x3": 194.99,
"r_y3": 531.31,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters."
},
{
"label": "section_header",
"id": 12,
"page_no": 5,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 555.92,
"r": 171.98,
"b": 566.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 566.66,
"r_x1": 57.93,
"r_y1": 566.66,
"r_x2": 57.93,
"r_y2": 555.92,
"r_x3": 50.11,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.35,
"r_y0": 566.66,
"r_x1": 171.98,
"r_y1": 566.66,
"r_x2": 171.98,
"r_y2": 555.92,
"r_x3": 68.35,
"r_y3": 555.92,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Experimental Results"
},
{
"label": "section_header",
"id": 13,
"page_no": 5,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 576.26,
"r": 179.18,
"b": 586.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 586.12,
"r_x1": 64.69,
"r_y1": 586.12,
"r_x2": 64.69,
"r_y2": 576.26,
"r_x3": 50.11,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.41,
"r_y0": 586.12,
"r_x1": 179.18,
"r_y1": 586.12,
"r_x2": 179.18,
"r_y2": 576.26,
"r_x3": 74.41,
"r_y3": 576.26,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.1. Implementation Details"
},
{
"label": "text",
"id": 7,
"page_no": 5,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 595.73,
"r": 286.37,
"b": 640.51,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 604.64,
"r_x1": 202.98,
"r_y1": 604.64,
"r_x2": 202.98,
"r_y2": 595.73,
"r_x3": 62.07,
"r_y3": 595.73,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.38,
"r_y0": 604.41,
"r_x1": 286.36,
"r_y1": 604.41,
"r_x2": 286.36,
"r_y2": 595.82,
"r_x3": 205.38,
"r_y3": 595.82,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 616.37,
"r_x1": 70.04,
"r_y1": 616.37,
"r_x2": 70.04,
"r_y2": 607.78,
"r_x3": 50.11,
"r_y3": 607.78,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 616.6,
"r_x1": 286.36,
"r_y1": 616.6,
"r_x2": 286.36,
"r_y2": 607.69,
"r_x3": 70.04,
"r_y3": 607.69,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 628.55,
"r_x1": 286.37,
"r_y1": 628.55,
"r_x2": 286.37,
"r_y2": 619.64,
"r_x3": 50.11,
"r_y3": 619.64,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 640.51,
"r_x1": 207.03,
"r_y1": 640.51,
"r_x2": 207.03,
"r_y2": 631.6,
"r_x3": 50.11,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"
},
{
"label": "formula",
"id": 18,
"page_no": 5,
"cluster": {
"id": 18,
"label": "formula",
"bbox": {
"l": 91.66,
"t": 653.83,
"r": 286.36,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.844,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.66,
"r_y0": 663.45,
"r_x1": 186.02,
"r_y1": 663.45,
"r_x2": 186.02,
"r_y2": 654.55,
"r_x3": 91.66,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.51,
"r_y0": 663.23,
"r_x1": 196.26,
"r_y1": 663.23,
"r_x2": 196.26,
"r_y2": 653.83,
"r_x3": 188.51,
"r_y3": 653.83,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.75,
"r_y0": 663.45,
"r_x1": 244.81,
"r_y1": 663.45,
"r_x2": 244.81,
"r_y2": 654.55,
"r_x3": 198.75,
"r_y3": 654.55,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.02,
"r_y0": 678.4,
"r_x1": 186.25,
"r_y1": 678.4,
"r_x2": 186.25,
"r_y2": 669.49,
"r_x3": 101.02,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.74,
"r_y0": 678.18,
"r_x1": 196.48,
"r_y1": 678.18,
"r_x2": 196.48,
"r_y2": 668.77,
"r_x3": 188.74,
"r_y3": 668.77,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.98,
"r_y0": 678.4,
"r_x1": 244.81,
"r_y1": 678.4,
"r_x2": 244.81,
"r_y2": 669.49,
"r_x3": 198.98,
"r_y3": 669.49,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 671.02,
"r_x1": 286.36,
"r_y1": 671.02,
"r_x2": 286.36,
"r_y2": 662.12,
"r_x3": 274.75,
"r_y3": 662.12,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"
},
{
"label": "text",
"id": 10,
"page_no": 5,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.972,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"
},
{
"label": "text",
"id": 9,
"page_no": 5,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 545.12,
"r_y1": 84.11,
"r_x2": 545.12,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 339.99,
"r_y1": 96.07,
"r_x2": 339.99,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.89,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 346.89,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 492.96,
"r_y1": 108.02,
"r_x2": 492.96,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."
},
{
"label": "text",
"id": 1,
"page_no": 5,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 116.23,
"r": 545.12,
"b": 328.37,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 125.14,
"r_x1": 545.11,
"r_y1": 125.14,
"r_x2": 545.11,
"r_y2": 116.23,
"r_x3": 320.82,
"r_y3": 116.23,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 137.09,
"r_x1": 545.12,
"r_y1": 137.09,
"r_x2": 545.12,
"r_y2": 128.18,
"r_x3": 308.86,
"r_y3": 128.18,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 149.05,
"r_x1": 545.12,
"r_y1": 149.05,
"r_x2": 545.12,
"r_y2": 140.14,
"r_x3": 308.86,
"r_y3": 140.14,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 161.0,
"r_x1": 545.12,
"r_y1": 161.0,
"r_x2": 545.12,
"r_y2": 152.09,
"r_x3": 308.86,
"r_y3": 152.09,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 172.96,
"r_x1": 545.12,
"r_y1": 172.96,
"r_x2": 545.12,
"r_y2": 164.05,
"r_x3": 308.86,
"r_y3": 164.05,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 184.91,
"r_x1": 467.22,
"r_y1": 184.91,
"r_x2": 467.22,
"r_y2": 176.01,
"r_x3": 308.86,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.44,
"r_y0": 184.91,
"r_x1": 545.12,
"r_y1": 184.91,
"r_x2": 545.12,
"r_y2": 176.01,
"r_x3": 475.44,
"r_y3": 176.01,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 196.87,
"r_x1": 545.12,
"r_y1": 196.87,
"r_x2": 545.12,
"r_y2": 187.96,
"r_x3": 308.86,
"r_y3": 187.96,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 208.82,
"r_x1": 545.12,
"r_y1": 208.82,
"r_x2": 545.12,
"r_y2": 199.92,
"r_x3": 308.86,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 220.78,
"r_x1": 545.12,
"r_y1": 220.78,
"r_x2": 545.12,
"r_y2": 211.87,
"r_x3": 308.86,
"r_y3": 211.87,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.73,
"r_x1": 545.12,
"r_y1": 232.73,
"r_x2": 545.12,
"r_y2": 223.83,
"r_x3": 308.86,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 244.69,
"r_x1": 545.12,
"r_y1": 244.69,
"r_x2": 545.12,
"r_y2": 235.78,
"r_x3": 308.86,
"r_y3": 235.78,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.64,
"r_x1": 545.12,
"r_y1": 256.64,
"r_x2": 545.12,
"r_y2": 247.74,
"r_x3": 308.86,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.6,
"r_x1": 342.34,
"r_y1": 268.6,
"r_x2": 342.34,
"r_y2": 259.69,
"r_x3": 308.86,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.95,
"r_y0": 268.6,
"r_x1": 545.12,
"r_y1": 268.6,
"r_x2": 545.12,
"r_y2": 259.69,
"r_x3": 348.95,
"r_y3": 259.69,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.55,
"r_x1": 545.12,
"r_y1": 280.55,
"r_x2": 545.12,
"r_y2": 271.65,
"r_x3": 308.86,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.51,
"r_x1": 545.12,
"r_y1": 292.51,
"r_x2": 545.12,
"r_y2": 283.6,
"r_x3": 308.86,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.46,
"r_x1": 545.12,
"r_y1": 304.46,
"r_x2": 545.12,
"r_y2": 295.56,
"r_x3": 308.86,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.42,
"r_x1": 545.12,
"r_y1": 316.42,
"r_x2": 545.12,
"r_y2": 307.51,
"r_x3": 308.86,
"r_y3": 307.51,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.37,
"r_x1": 532.48,
"r_y1": 328.37,
"r_x2": 532.48,
"r_y2": 319.47,
"r_x3": 308.86,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."
},
{
"label": "text",
"id": 3,
"page_no": 5,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.86,
"t": 336.58,
"r": 545.12,
"b": 429.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 345.48,
"r_x1": 545.11,
"r_y1": 345.48,
"r_x2": 545.11,
"r_y2": 336.58,
"r_x3": 320.82,
"r_y3": 336.58,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 357.44,
"r_x1": 403.74,
"r_y1": 357.44,
"r_x2": 403.74,
"r_y2": 348.53,
"r_x3": 308.86,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.08,
"r_y0": 357.21,
"r_x1": 503.54,
"r_y1": 357.21,
"r_x2": 503.54,
"r_y2": 348.62,
"r_x3": 406.08,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.54,
"r_y0": 357.44,
"r_x1": 506.03,
"r_y1": 357.44,
"r_x2": 506.03,
"r_y2": 348.53,
"r_x3": 503.54,
"r_y3": 348.53,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.21,
"r_x1": 545.11,
"r_y1": 357.21,
"r_x2": 545.11,
"r_y2": 348.62,
"r_x3": 508.4,
"r_y3": 348.62,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 369.16,
"r_x1": 343.16,
"r_y1": 369.16,
"r_x2": 343.16,
"r_y2": 360.58,
"r_x3": 308.86,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.16,
"r_y0": 369.39,
"r_x1": 362.2,
"r_y1": 369.39,
"r_x2": 362.2,
"r_y2": 360.49,
"r_x3": 343.16,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.29,
"r_y0": 369.16,
"r_x1": 440.94,
"r_y1": 369.16,
"r_x2": 440.94,
"r_y2": 360.58,
"r_x3": 364.29,
"r_y3": 360.58,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.94,
"r_y0": 369.39,
"r_x1": 545.11,
"r_y1": 369.39,
"r_x2": 545.11,
"r_y2": 360.49,
"r_x3": 440.94,
"r_y3": 360.49,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 381.35,
"r_x1": 545.12,
"r_y1": 381.35,
"r_x2": 545.12,
"r_y2": 372.44,
"r_x3": 308.86,
"r_y3": 372.44,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 393.31,
"r_x1": 545.12,
"r_y1": 393.31,
"r_x2": 545.12,
"r_y2": 384.4,
"r_x3": 308.86,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 405.04,
"r_x1": 314.67,
"r_y1": 405.04,
"r_x2": 314.67,
"r_y2": 396.19,
"r_x3": 308.86,
"r_y3": 396.19,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.66,
"r_y0": 405.26,
"r_x1": 360.39,
"r_y1": 405.26,
"r_x2": 360.39,
"r_y2": 396.35,
"r_x3": 318.66,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.96,
"r_y0": 405.26,
"r_x1": 545.11,
"r_y1": 405.26,
"r_x2": 545.11,
"r_y2": 396.35,
"r_x3": 367.96,
"r_y3": 396.35,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 417.21,
"r_x1": 545.12,
"r_y1": 417.21,
"r_x2": 545.12,
"r_y2": 408.31,
"r_x3": 308.86,
"r_y3": 408.31,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 429.17,
"r_x1": 360.97,
"r_y1": 429.17,
"r_x2": 360.97,
"r_y2": 420.26,
"r_x3": 308.86,
"r_y3": 420.26,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."
},
{
"label": "text",
"id": 0,
"page_no": 5,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 437.37,
"r": 545.12,
"b": 553.88,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 446.28,
"r_x1": 545.11,
"r_y1": 446.28,
"r_x2": 545.11,
"r_y2": 437.37,
"r_x3": 320.82,
"r_y3": 437.37,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 458.24,
"r_x1": 384.63,
"r_y1": 458.24,
"r_x2": 384.63,
"r_y2": 449.33,
"r_x3": 308.86,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 458.24,
"r_x1": 545.12,
"r_y1": 458.24,
"r_x2": 545.12,
"r_y2": 449.33,
"r_x3": 391.37,
"r_y3": 449.33,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 470.19,
"r_x1": 494.01,
"r_y1": 470.19,
"r_x2": 494.01,
"r_y2": 461.28,
"r_x3": 308.86,
"r_y3": 461.28,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.08,
"r_y0": 469.96,
"r_x1": 545.11,
"r_y1": 469.96,
"r_x2": 545.11,
"r_y2": 461.37,
"r_x3": 498.08,
"r_y3": 461.37,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 481.92,
"r_x1": 364.44,
"r_y1": 481.92,
"r_x2": 364.44,
"r_y2": 473.33,
"r_x3": 308.86,
"r_y3": 473.33,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.06,
"r_y0": 482.15,
"r_x1": 545.11,
"r_y1": 482.15,
"r_x2": 545.11,
"r_y2": 473.24,
"r_x3": 367.06,
"r_y3": 473.24,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 494.1,
"r_x1": 545.12,
"r_y1": 494.1,
"r_x2": 545.12,
"r_y2": 485.19,
"r_x3": 308.86,
"r_y3": 485.19,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 506.06,
"r_x1": 545.12,
"r_y1": 506.06,
"r_x2": 545.12,
"r_y2": 497.15,
"r_x3": 308.86,
"r_y3": 497.15,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 518.01,
"r_x1": 545.12,
"r_y1": 518.01,
"r_x2": 545.12,
"r_y2": 509.11,
"r_x3": 308.86,
"r_y3": 509.11,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 529.97,
"r_x1": 545.12,
"r_y1": 529.97,
"r_x2": 545.12,
"r_y2": 521.06,
"r_x3": 308.86,
"r_y3": 521.06,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 541.92,
"r_x1": 545.12,
"r_y1": 541.92,
"r_x2": 545.12,
"r_y2": 533.02,
"r_x3": 308.86,
"r_y3": 533.02,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 553.88,
"r_x1": 377.22,
"r_y1": 553.88,
"r_x2": 377.22,
"r_y2": 544.97,
"r_x3": 308.86,
"r_y3": 544.97,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."
},
{
"label": "section_header",
"id": 14,
"page_no": 5,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 579.55,
"r": 397.44,
"b": 589.41,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 589.41,
"r_x1": 323.9,
"r_y1": 589.41,
"r_x2": 323.9,
"r_y2": 579.55,
"r_x3": 308.86,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.93,
"r_y0": 589.41,
"r_x1": 397.44,
"r_y1": 589.41,
"r_x2": 397.44,
"r_y2": 579.55,
"r_x3": 333.93,
"r_y3": 579.55,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.2. Generalization"
},
{
"label": "text",
"id": 2,
"page_no": 5,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.86,
"t": 603.45,
"r": 545.12,
"b": 672.13,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 612.36,
"r_x1": 545.11,
"r_y1": 612.36,
"r_x2": 545.11,
"r_y2": 603.45,
"r_x3": 320.82,
"r_y3": 603.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 624.31,
"r_x1": 545.12,
"r_y1": 624.31,
"r_x2": 545.12,
"r_y2": 615.4,
"r_x3": 308.86,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 636.27,
"r_x1": 545.12,
"r_y1": 636.27,
"r_x2": 545.12,
"r_y2": 627.36,
"r_x3": 308.86,
"r_y3": 627.36,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 648.22,
"r_x1": 545.12,
"r_y1": 648.22,
"r_x2": 545.12,
"r_y2": 639.31,
"r_x3": 308.86,
"r_y3": 639.31,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 660.18,
"r_x1": 545.12,
"r_y1": 660.18,
"r_x2": 545.12,
"r_y2": 651.27,
"r_x3": 308.86,
"r_y3": 651.27,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 672.13,
"r_x1": 350.7,
"r_y1": 672.13,
"r_x2": 350.7,
"r_y2": 663.23,
"r_x3": 308.86,
"r_y3": 663.23,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."
},
{
"label": "text",
"id": 8,
"page_no": 5,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 680.34,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 689.24,
"r_x1": 545.12,
"r_y1": 689.24,
"r_x2": 545.12,
"r_y2": 680.34,
"r_x3": 320.82,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 701.2,
"r_x1": 396.21,
"r_y1": 701.2,
"r_x2": 396.21,
"r_y2": 692.29,
"r_x3": 308.86,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.41,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 406.41,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 495.94,
"r_y1": 713.15,
"r_x2": 495.94,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."
}
],
"headers": [
{
"label": "page_footer",
"id": 17,
"page_no": 5,
"cluster": {
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6"
}
]
}
},
{
"page_no": 6,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.25,
"r_x1": 63.7,
"r_y1": 84.25,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.11,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.77,
"r_y0": 84.25,
"r_x1": 167.9,
"r_y1": 84.25,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.77,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 102.26,
"r_x1": 286.36,
"r_y1": 102.26,
"r_x2": 286.36,
"r_y2": 93.35,
"r_x3": 62.07,
"r_y3": 93.35,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 114.21,
"r_x1": 286.37,
"r_y1": 114.21,
"r_x2": 286.37,
"r_y2": 105.31,
"r_x3": 50.11,
"r_y3": 105.31,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 126.17,
"r_x1": 286.37,
"r_y1": 126.17,
"r_x2": 286.37,
"r_y2": 117.26,
"r_x3": 50.11,
"r_y3": 117.26,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 138.12,
"r_x1": 136.72,
"r_y1": 138.12,
"r_x2": 136.72,
"r_y2": 129.22,
"r_x3": 50.11,
"r_y3": 129.22,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.22,
"r_y0": 165.9,
"r_x1": 118.88,
"r_y1": 165.9,
"r_x2": 118.88,
"r_y2": 157.06,
"r_x3": 86.22,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.87,
"r_y0": 165.9,
"r_x1": 143.27,
"r_y1": 165.9,
"r_x2": 143.27,
"r_y2": 157.06,
"r_x3": 118.87,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.77,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.06,
"r_x3": 143.77,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.12,
"r_y0": 165.9,
"r_x1": 175.87,
"r_y1": 165.9,
"r_x2": 175.87,
"r_y2": 156.5,
"r_x3": 168.12,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.28,
"r_y0": 159.16,
"r_x1": 221.96,
"r_y1": 159.16,
"r_x2": 221.96,
"r_y2": 150.32,
"r_x3": 179.28,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.95,
"r_y0": 159.16,
"r_x1": 246.35,
"r_y1": 159.16,
"r_x2": 246.35,
"r_y2": 150.32,
"r_x3": 221.95,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.84,
"r_y0": 159.16,
"r_x1": 250.72,
"r_y1": 159.16,
"r_x2": 250.72,
"r_y2": 150.32,
"r_x3": 246.84,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.21,
"r_y0": 172.74,
"r_x1": 206.29,
"r_y1": 172.74,
"r_x2": 206.29,
"r_y2": 163.89,
"r_x3": 182.21,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.29,
"r_y0": 172.74,
"r_x1": 209.06,
"r_y1": 172.74,
"r_x2": 209.06,
"r_y2": 163.33,
"r_x3": 206.29,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.06,
"r_y0": 172.74,
"r_x1": 219.2,
"r_y1": 172.74,
"r_x2": 219.2,
"r_y2": 163.89,
"r_x3": 209.06,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.74,
"r_x1": 222.46,
"r_y1": 172.74,
"r_x2": 222.46,
"r_y2": 163.33,
"r_x3": 219.7,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.12,
"r_y0": 172.74,
"r_x1": 226.89,
"r_y1": 172.74,
"r_x2": 226.89,
"r_y2": 163.89,
"r_x3": 224.12,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.55,
"r_y0": 172.74,
"r_x1": 231.32,
"r_y1": 172.74,
"r_x2": 231.32,
"r_y2": 163.33,
"r_x3": 228.55,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.32,
"r_y0": 172.74,
"r_x1": 240.65,
"r_y1": 172.74,
"r_x2": 240.65,
"r_y2": 163.89,
"r_x3": 231.32,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.14,
"r_y0": 172.74,
"r_x1": 243.91,
"r_y1": 172.74,
"r_x2": 243.91,
"r_y2": 163.33,
"r_x3": 241.14,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.91,
"r_y0": 172.74,
"r_x1": 247.79,
"r_y1": 172.74,
"r_x2": 247.79,
"r_y2": 163.89,
"r_x3": 243.91,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 166.12,
"r_x1": 286.36,
"r_y1": 166.12,
"r_x2": 286.36,
"r_y2": 157.22,
"r_x3": 274.75,
"r_y3": 157.22,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 190.07,
"r_x1": 86.41,
"r_y1": 190.07,
"r_x2": 86.41,
"r_y2": 181.16,
"r_x3": 62.07,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.58,
"r_y0": 189.85,
"r_x1": 98.72,
"r_y1": 189.85,
"r_x2": 98.72,
"r_y2": 181.0,
"r_x3": 88.58,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.07,
"r_x1": 115.78,
"r_y1": 190.07,
"r_x2": 115.78,
"r_y2": 181.16,
"r_x3": 101.4,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.96,
"r_y0": 189.85,
"r_x1": 127.29,
"r_y1": 189.85,
"r_x2": 127.29,
"r_y2": 181.0,
"r_x3": 117.96,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.96,
"r_y0": 190.07,
"r_x1": 286.36,
"r_y1": 190.07,
"r_x2": 286.36,
"r_y2": 181.16,
"r_x3": 129.96,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 202.02,
"r_x1": 252.78,
"r_y1": 202.02,
"r_x2": 252.78,
"r_y2": 193.12,
"r_x3": 50.11,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.18,
"r_y0": 201.8,
"r_x1": 257.95,
"r_y1": 201.8,
"r_x2": 257.95,
"r_y2": 192.4,
"r_x3": 255.18,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.95,
"r_y0": 201.8,
"r_x1": 263.77,
"r_y1": 201.8,
"r_x2": 263.77,
"r_y2": 192.96,
"r_x3": 257.95,
"r_y3": 192.96,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.15,
"r_y0": 201.8,
"r_x1": 267.92,
"r_y1": 201.8,
"r_x2": 267.92,
"r_y2": 192.4,
"r_x3": 265.15,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.32,
"r_y0": 202.02,
"r_x1": 286.36,
"r_y1": 202.02,
"r_x2": 286.36,
"r_y2": 193.12,
"r_x3": 270.32,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 213.98,
"r_x1": 172.13,
"r_y1": 213.98,
"r_x2": 172.13,
"r_y2": 205.07,
"r_x3": 50.11,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.62,
"r_y0": 213.76,
"r_x1": 180.45,
"r_y1": 213.76,
"r_x2": 180.45,
"r_y2": 204.91,
"r_x3": 174.62,
"r_y3": 204.91,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.83,
"r_y0": 213.98,
"r_x1": 184.32,
"r_y1": 213.98,
"r_x2": 184.32,
"r_y2": 205.07,
"r_x3": 181.83,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 234.67,
"r_x1": 64.55,
"r_y1": 234.67,
"r_x2": 64.55,
"r_y2": 224.82,
"r_x3": 50.11,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.18,
"r_y0": 234.67,
"r_x1": 170.45,
"r_y1": 234.67,
"r_x2": 170.45,
"r_y2": 224.82,
"r_x3": 74.18,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.61,
"r_x1": 105.32,
"r_y1": 252.61,
"r_x2": 105.32,
"r_y2": 243.65,
"r_x3": 62.07,
"r_y3": 243.65,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.13,
"r_y0": 252.68,
"r_x1": 184.68,
"r_y1": 252.68,
"r_x2": 184.68,
"r_y2": 243.77,
"r_x3": 112.13,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.48,
"r_y0": 252.68,
"r_x1": 286.36,
"r_y1": 252.68,
"r_x2": 286.36,
"r_y2": 243.77,
"r_x3": 191.48,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.63,
"r_x1": 286.37,
"r_y1": 264.63,
"r_x2": 286.37,
"r_y2": 255.72,
"r_x3": 50.11,
"r_y3": 255.72,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.59,
"r_x1": 286.37,
"r_y1": 276.59,
"r_x2": 286.37,
"r_y2": 267.68,
"r_x3": 50.11,
"r_y3": 267.68,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.54,
"r_x1": 286.37,
"r_y1": 288.54,
"r_x2": 286.37,
"r_y2": 279.63,
"r_x3": 50.11,
"r_y3": 279.63,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.5,
"r_x1": 286.37,
"r_y1": 300.5,
"r_x2": 286.37,
"r_y2": 291.59,
"r_x3": 50.11,
"r_y3": 291.59,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.45,
"r_x1": 286.37,
"r_y1": 312.45,
"r_x2": 286.37,
"r_y2": 303.55,
"r_x3": 50.11,
"r_y3": 303.55,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.41,
"r_x1": 286.37,
"r_y1": 324.41,
"r_x2": 286.37,
"r_y2": 315.5,
"r_x3": 50.11,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.36,
"r_x1": 286.37,
"r_y1": 336.36,
"r_x2": 286.37,
"r_y2": 327.46,
"r_x3": 50.11,
"r_y3": 327.46,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.32,
"r_x1": 286.37,
"r_y1": 348.32,
"r_x2": 286.37,
"r_y2": 339.41,
"r_x3": 50.11,
"r_y3": 339.41,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.27,
"r_x1": 286.37,
"r_y1": 360.27,
"r_x2": 286.37,
"r_y2": 351.37,
"r_x3": 50.11,
"r_y3": 351.37,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.23,
"r_x1": 286.37,
"r_y1": 372.23,
"r_x2": 286.37,
"r_y2": 363.32,
"r_x3": 50.11,
"r_y3": 363.32,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.18,
"r_x1": 286.37,
"r_y1": 384.18,
"r_x2": 286.37,
"r_y2": 375.28,
"r_x3": 50.11,
"r_y3": 375.28,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.14,
"r_x1": 170.01,
"r_y1": 396.14,
"r_x2": 170.01,
"r_y2": 387.23,
"r_x3": 50.11,
"r_y3": 387.23,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 601.34,
"r_x1": 286.37,
"r_y1": 601.34,
"r_x2": 286.37,
"r_y2": 592.43,
"r_x3": 50.11,
"r_y3": 592.43,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 613.29,
"r_x1": 247.46,
"r_y1": 613.29,
"r_x2": 247.46,
"r_y2": 604.39,
"r_x3": 50.11,
"r_y3": 604.39,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 625.25,
"r_x1": 261.79,
"r_y1": 625.25,
"r_x2": 261.79,
"r_y2": 616.34,
"r_x3": 50.11,
"r_y3": 616.34,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 653.31,
"r_x1": 124.72,
"r_y1": 653.31,
"r_x2": 124.72,
"r_y2": 644.35,
"r_x3": 62.07,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.38,
"r_x1": 242.93,
"r_y1": 653.38,
"r_x2": 242.93,
"r_y2": 644.47,
"r_x3": 128.2,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.55,
"r_y0": 653.15,
"r_x1": 286.36,
"r_y1": 653.15,
"r_x2": 286.36,
"r_y2": 644.56,
"r_x3": 245.55,
"r_y3": 644.56,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.1,
"r_x1": 84.97,
"r_y1": 665.1,
"r_x2": 84.97,
"r_y2": 656.51,
"r_x3": 50.11,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.52,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 89.52,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 322.14,
"r_y1": 84.11,
"r_x2": 322.14,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.45,
"r_y0": 83.89,
"r_x1": 404.57,
"r_y1": 83.89,
"r_x2": 404.57,
"r_y2": 75.3,
"r_x3": 325.45,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.11,
"r_x1": 545.11,
"r_y1": 84.11,
"r_x2": 545.11,
"r_y2": 75.21,
"r_x3": 408.1,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 470.23,
"r_y1": 108.02,
"r_x2": 470.23,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.53,
"r_y0": 108.02,
"r_x1": 545.12,
"r_y1": 108.02,
"r_x2": 545.12,
"r_y2": 99.12,
"r_x3": 477.53,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 119.98,
"r_x1": 545.12,
"r_y1": 119.98,
"r_x2": 545.12,
"r_y2": 111.07,
"r_x3": 308.86,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 131.93,
"r_x1": 545.12,
"r_y1": 131.93,
"r_x2": 545.12,
"r_y2": 123.03,
"r_x3": 308.86,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 143.89,
"r_x1": 502.02,
"r_y1": 143.89,
"r_x2": 502.02,
"r_y2": 134.98,
"r_x3": 308.86,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.47,
"r_y0": 143.66,
"r_x1": 545.11,
"r_y1": 143.66,
"r_x2": 545.11,
"r_y2": 135.07,
"r_x3": 504.47,
"r_y3": 135.07,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 155.62,
"r_x1": 343.16,
"r_y1": 155.62,
"r_x2": 343.16,
"r_y2": 147.03,
"r_x3": 308.86,
"r_y3": 147.03,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.37,
"r_y0": 155.85,
"r_x1": 545.11,
"r_y1": 155.85,
"r_x2": 545.11,
"r_y2": 146.94,
"r_x3": 346.37,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 167.8,
"r_x1": 446.16,
"r_y1": 167.8,
"r_x2": 446.16,
"r_y2": 158.89,
"r_x3": 308.86,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.29,
"r_y0": 167.57,
"r_x1": 525.04,
"r_y1": 167.57,
"r_x2": 525.04,
"r_y2": 158.98,
"r_x3": 448.29,
"r_y3": 158.98,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.11,
"r_y1": 167.8,
"r_x2": 545.11,
"r_y2": 158.89,
"r_x3": 527.4,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 179.76,
"r_x1": 545.12,
"r_y1": 179.76,
"r_x2": 545.12,
"r_y2": 170.85,
"r_x3": 308.86,
"r_y3": 170.85,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 191.71,
"r_x1": 432.87,
"r_y1": 191.71,
"r_x2": 432.87,
"r_y2": 182.8,
"r_x3": 308.86,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.39,
"r_y0": 191.48,
"r_x1": 510.93,
"r_y1": 191.48,
"r_x2": 510.93,
"r_y2": 182.89,
"r_x3": 436.39,
"r_y3": 182.89,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.68,
"r_y0": 191.71,
"r_x1": 545.11,
"r_y1": 191.71,
"r_x2": 545.11,
"r_y2": 182.8,
"r_x3": 514.68,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 203.67,
"r_x1": 431.17,
"r_y1": 203.67,
"r_x2": 431.17,
"r_y2": 194.76,
"r_x3": 308.86,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.68,
"r_y0": 203.44,
"r_x1": 514.18,
"r_y1": 203.44,
"r_x2": 514.18,
"r_y2": 194.85,
"r_x3": 434.68,
"r_y3": 194.85,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.18,
"r_y0": 203.67,
"r_x1": 545.11,
"r_y1": 203.67,
"r_x2": 545.11,
"r_y2": 194.76,
"r_x3": 514.18,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 215.39,
"r_x1": 382.36,
"r_y1": 215.39,
"r_x2": 382.36,
"r_y2": 206.81,
"r_x3": 308.86,
"r_y3": 206.81,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.08,
"r_y0": 215.62,
"r_x1": 545.11,
"r_y1": 215.62,
"r_x2": 545.11,
"r_y2": 206.72,
"r_x3": 385.08,
"r_y3": 206.72,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 227.58,
"r_x1": 501.7,
"r_y1": 227.58,
"r_x2": 501.7,
"r_y2": 218.67,
"r_x3": 308.86,
"r_y3": 218.67,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 325.36,
"r_x1": 341.5,
"r_y1": 325.36,
"r_x2": 341.5,
"r_y2": 316.45,
"r_x3": 308.86,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.36,
"r_x1": 545.12,
"r_y1": 325.36,
"r_x2": 545.12,
"r_y2": 316.45,
"r_x3": 348.6,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.31,
"r_x1": 474.98,
"r_y1": 337.31,
"r_x2": 474.98,
"r_y2": 328.4,
"r_x3": 308.86,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 376.64,
"r_x1": 378.95,
"r_y1": 376.64,
"r_x2": 378.95,
"r_y2": 367.68,
"r_x3": 320.82,
"r_y3": 367.68,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.08,
"r_y0": 376.71,
"r_x1": 545.12,
"r_y1": 376.71,
"r_x2": 545.12,
"r_y2": 367.8,
"r_x3": 387.08,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.66,
"r_x1": 487.19,
"r_y1": 388.66,
"r_x2": 487.19,
"r_y2": 379.75,
"r_x3": 308.86,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.97,
"r_y0": 388.66,
"r_x1": 545.12,
"r_y1": 388.66,
"r_x2": 545.12,
"r_y2": 379.75,
"r_x3": 493.97,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.62,
"r_x1": 545.12,
"r_y1": 400.62,
"r_x2": 545.12,
"r_y2": 391.71,
"r_x3": 308.86,
"r_y3": 391.71,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.57,
"r_x1": 545.12,
"r_y1": 412.57,
"r_x2": 545.12,
"r_y2": 403.67,
"r_x3": 308.86,
"r_y3": 403.67,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.53,
"r_x1": 314.08,
"r_y1": 424.53,
"r_x2": 314.08,
"r_y2": 415.62,
"r_x3": 308.86,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.69,
"r_y0": 424.53,
"r_x1": 545.12,
"r_y1": 424.53,
"r_x2": 545.12,
"r_y2": 415.62,
"r_x3": 316.69,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.48,
"r_x1": 545.12,
"r_y1": 436.48,
"r_x2": 545.12,
"r_y2": 427.58,
"r_x3": 308.86,
"r_y3": 427.58,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.44,
"r_x1": 545.12,
"r_y1": 448.44,
"r_x2": 545.12,
"r_y2": 439.53,
"r_x3": 308.86,
"r_y3": 439.53,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 460.39,
"r_x1": 350.24,
"r_y1": 460.39,
"r_x2": 350.24,
"r_y2": 451.49,
"r_x3": 308.86,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.18,
"r_y0": 460.32,
"r_x1": 374.59,
"r_y1": 460.32,
"r_x2": 374.59,
"r_y2": 451.37,
"r_x3": 352.18,
"r_y3": 451.37,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.53,
"r_y0": 460.39,
"r_x1": 545.11,
"r_y1": 460.39,
"r_x2": 545.11,
"r_y2": 451.49,
"r_x3": 376.53,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 472.35,
"r_x1": 545.12,
"r_y1": 472.35,
"r_x2": 545.12,
"r_y2": 463.44,
"r_x3": 308.86,
"r_y3": 463.44,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.3,
"r_x1": 545.12,
"r_y1": 484.3,
"r_x2": 545.12,
"r_y2": 475.4,
"r_x3": 308.86,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.26,
"r_x1": 545.12,
"r_y1": 496.26,
"r_x2": 545.12,
"r_y2": 487.35,
"r_x3": 308.86,
"r_y3": 487.35,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.21,
"r_x1": 545.12,
"r_y1": 508.21,
"r_x2": 545.12,
"r_y2": 499.31,
"r_x3": 308.86,
"r_y3": 499.31,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.17,
"r_x1": 405.7,
"r_y1": 520.17,
"r_x2": 405.7,
"r_y2": 511.26,
"r_x3": 308.86,
"r_y3": 511.26,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.77,
"r_x1": 341.74,
"r_y1": 665.77,
"r_x2": 341.74,
"r_y2": 656.86,
"r_x3": 308.86,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.56,
"r_y0": 665.77,
"r_x1": 545.12,
"r_y1": 665.77,
"r_x2": 545.12,
"r_y2": 656.86,
"r_x3": 349.56,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.72,
"r_x1": 545.12,
"r_y1": 677.72,
"r_x2": 545.12,
"r_y2": 668.82,
"r_x3": 308.86,
"r_y3": 668.82,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.68,
"r_x1": 435.04,
"r_y1": 689.68,
"r_x2": 435.04,
"r_y2": 680.77,
"r_x3": 308.86,
"r_y3": 680.77,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 74.4,
"r": 167.9,
"b": 84.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.25,
"r_x1": 63.7,
"r_y1": 84.25,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.11,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.77,
"r_y0": 84.25,
"r_x1": 167.9,
"r_y1": 84.25,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.77,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 93.35,
"r": 286.37,
"b": 138.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 102.26,
"r_x1": 286.36,
"r_y1": 102.26,
"r_x2": 286.36,
"r_y2": 93.35,
"r_x3": 62.07,
"r_y3": 93.35,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 114.21,
"r_x1": 286.37,
"r_y1": 114.21,
"r_x2": 286.37,
"r_y2": 105.31,
"r_x3": 50.11,
"r_y3": 105.31,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 126.17,
"r_x1": 286.37,
"r_y1": 126.17,
"r_x2": 286.37,
"r_y2": 117.26,
"r_x3": 50.11,
"r_y3": 117.26,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 138.12,
"r_x1": 136.72,
"r_y1": 138.12,
"r_x2": 136.72,
"r_y2": 129.22,
"r_x3": 50.11,
"r_y3": 129.22,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "formula",
"bbox": {
"l": 86.22,
"t": 150.32,
"r": 286.36,
"b": 172.74,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.22,
"r_y0": 165.9,
"r_x1": 118.88,
"r_y1": 165.9,
"r_x2": 118.88,
"r_y2": 157.06,
"r_x3": 86.22,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.87,
"r_y0": 165.9,
"r_x1": 143.27,
"r_y1": 165.9,
"r_x2": 143.27,
"r_y2": 157.06,
"r_x3": 118.87,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.77,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.06,
"r_x3": 143.77,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.12,
"r_y0": 165.9,
"r_x1": 175.87,
"r_y1": 165.9,
"r_x2": 175.87,
"r_y2": 156.5,
"r_x3": 168.12,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.28,
"r_y0": 159.16,
"r_x1": 221.96,
"r_y1": 159.16,
"r_x2": 221.96,
"r_y2": 150.32,
"r_x3": 179.28,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.95,
"r_y0": 159.16,
"r_x1": 246.35,
"r_y1": 159.16,
"r_x2": 246.35,
"r_y2": 150.32,
"r_x3": 221.95,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.84,
"r_y0": 159.16,
"r_x1": 250.72,
"r_y1": 159.16,
"r_x2": 250.72,
"r_y2": 150.32,
"r_x3": 246.84,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.21,
"r_y0": 172.74,
"r_x1": 206.29,
"r_y1": 172.74,
"r_x2": 206.29,
"r_y2": 163.89,
"r_x3": 182.21,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.29,
"r_y0": 172.74,
"r_x1": 209.06,
"r_y1": 172.74,
"r_x2": 209.06,
"r_y2": 163.33,
"r_x3": 206.29,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.06,
"r_y0": 172.74,
"r_x1": 219.2,
"r_y1": 172.74,
"r_x2": 219.2,
"r_y2": 163.89,
"r_x3": 209.06,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.74,
"r_x1": 222.46,
"r_y1": 172.74,
"r_x2": 222.46,
"r_y2": 163.33,
"r_x3": 219.7,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.12,
"r_y0": 172.74,
"r_x1": 226.89,
"r_y1": 172.74,
"r_x2": 226.89,
"r_y2": 163.89,
"r_x3": 224.12,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.55,
"r_y0": 172.74,
"r_x1": 231.32,
"r_y1": 172.74,
"r_x2": 231.32,
"r_y2": 163.33,
"r_x3": 228.55,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.32,
"r_y0": 172.74,
"r_x1": 240.65,
"r_y1": 172.74,
"r_x2": 240.65,
"r_y2": 163.89,
"r_x3": 231.32,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.14,
"r_y0": 172.74,
"r_x1": 243.91,
"r_y1": 172.74,
"r_x2": 243.91,
"r_y2": 163.33,
"r_x3": 241.14,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.91,
"r_y0": 172.74,
"r_x1": 247.79,
"r_y1": 172.74,
"r_x2": 247.79,
"r_y2": 163.89,
"r_x3": 243.91,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 166.12,
"r_x1": 286.36,
"r_y1": 166.12,
"r_x2": 286.36,
"r_y2": 157.22,
"r_x3": 274.75,
"r_y3": 157.22,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 181.0,
"r": 286.36,
"b": 213.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 190.07,
"r_x1": 86.41,
"r_y1": 190.07,
"r_x2": 86.41,
"r_y2": 181.16,
"r_x3": 62.07,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.58,
"r_y0": 189.85,
"r_x1": 98.72,
"r_y1": 189.85,
"r_x2": 98.72,
"r_y2": 181.0,
"r_x3": 88.58,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.07,
"r_x1": 115.78,
"r_y1": 190.07,
"r_x2": 115.78,
"r_y2": 181.16,
"r_x3": 101.4,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.96,
"r_y0": 189.85,
"r_x1": 127.29,
"r_y1": 189.85,
"r_x2": 127.29,
"r_y2": 181.0,
"r_x3": 117.96,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.96,
"r_y0": 190.07,
"r_x1": 286.36,
"r_y1": 190.07,
"r_x2": 286.36,
"r_y2": 181.16,
"r_x3": 129.96,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 202.02,
"r_x1": 252.78,
"r_y1": 202.02,
"r_x2": 252.78,
"r_y2": 193.12,
"r_x3": 50.11,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.18,
"r_y0": 201.8,
"r_x1": 257.95,
"r_y1": 201.8,
"r_x2": 257.95,
"r_y2": 192.4,
"r_x3": 255.18,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.95,
"r_y0": 201.8,
"r_x1": 263.77,
"r_y1": 201.8,
"r_x2": 263.77,
"r_y2": 192.96,
"r_x3": 257.95,
"r_y3": 192.96,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.15,
"r_y0": 201.8,
"r_x1": 267.92,
"r_y1": 201.8,
"r_x2": 267.92,
"r_y2": 192.4,
"r_x3": 265.15,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.32,
"r_y0": 202.02,
"r_x1": 286.36,
"r_y1": 202.02,
"r_x2": 286.36,
"r_y2": 193.12,
"r_x3": 270.32,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 213.98,
"r_x1": 172.13,
"r_y1": 213.98,
"r_x2": 172.13,
"r_y2": 205.07,
"r_x3": 50.11,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.62,
"r_y0": 213.76,
"r_x1": 180.45,
"r_y1": 213.76,
"r_x2": 180.45,
"r_y2": 204.91,
"r_x3": 174.62,
"r_y3": 204.91,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.83,
"r_y0": 213.98,
"r_x1": 184.32,
"r_y1": 213.98,
"r_x2": 184.32,
"r_y2": 205.07,
"r_x3": 181.83,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 224.82,
"r": 170.45,
"b": 234.67,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 234.67,
"r_x1": 64.55,
"r_y1": 234.67,
"r_x2": 64.55,
"r_y2": 224.82,
"r_x3": 50.11,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.18,
"r_y0": 234.67,
"r_x1": 170.45,
"r_y1": 234.67,
"r_x2": 170.45,
"r_y2": 224.82,
"r_x3": 74.18,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.65,
"r": 286.37,
"b": 396.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.61,
"r_x1": 105.32,
"r_y1": 252.61,
"r_x2": 105.32,
"r_y2": 243.65,
"r_x3": 62.07,
"r_y3": 243.65,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.13,
"r_y0": 252.68,
"r_x1": 184.68,
"r_y1": 252.68,
"r_x2": 184.68,
"r_y2": 243.77,
"r_x3": 112.13,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.48,
"r_y0": 252.68,
"r_x1": 286.36,
"r_y1": 252.68,
"r_x2": 286.36,
"r_y2": 243.77,
"r_x3": 191.48,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.63,
"r_x1": 286.37,
"r_y1": 264.63,
"r_x2": 286.37,
"r_y2": 255.72,
"r_x3": 50.11,
"r_y3": 255.72,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.59,
"r_x1": 286.37,
"r_y1": 276.59,
"r_x2": 286.37,
"r_y2": 267.68,
"r_x3": 50.11,
"r_y3": 267.68,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.54,
"r_x1": 286.37,
"r_y1": 288.54,
"r_x2": 286.37,
"r_y2": 279.63,
"r_x3": 50.11,
"r_y3": 279.63,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.5,
"r_x1": 286.37,
"r_y1": 300.5,
"r_x2": 286.37,
"r_y2": 291.59,
"r_x3": 50.11,
"r_y3": 291.59,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.45,
"r_x1": 286.37,
"r_y1": 312.45,
"r_x2": 286.37,
"r_y2": 303.55,
"r_x3": 50.11,
"r_y3": 303.55,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.41,
"r_x1": 286.37,
"r_y1": 324.41,
"r_x2": 286.37,
"r_y2": 315.5,
"r_x3": 50.11,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.36,
"r_x1": 286.37,
"r_y1": 336.36,
"r_x2": 286.37,
"r_y2": 327.46,
"r_x3": 50.11,
"r_y3": 327.46,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.32,
"r_x1": 286.37,
"r_y1": 348.32,
"r_x2": 286.37,
"r_y2": 339.41,
"r_x3": 50.11,
"r_y3": 339.41,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.27,
"r_x1": 286.37,
"r_y1": 360.27,
"r_x2": 286.37,
"r_y2": 351.37,
"r_x3": 50.11,
"r_y3": 351.37,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.23,
"r_x1": 286.37,
"r_y1": 372.23,
"r_x2": 286.37,
"r_y2": 363.32,
"r_x3": 50.11,
"r_y3": 363.32,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.18,
"r_x1": 286.37,
"r_y1": 384.18,
"r_x2": 286.37,
"r_y2": 375.28,
"r_x3": 50.11,
"r_y3": 375.28,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.14,
"r_x1": 170.01,
"r_y1": 396.14,
"r_x2": 170.01,
"r_y2": 387.23,
"r_x3": 50.11,
"r_y3": 387.23,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "table",
"bbox": {
"l": 53.37,
"t": 409.14,
"r": 283.04,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.989,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.36,
"t": 426.67,
"r": 247.74,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 15,
"label": "text",
"bbox": {
"l": 50.11,
"t": 592.43,
"r": 286.37,
"b": 613.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.721,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 601.34,
"r_x1": 286.37,
"r_y1": 601.34,
"r_x2": 286.37,
"r_y2": 592.43,
"r_x3": 50.11,
"r_y3": 592.43,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 613.29,
"r_x1": 247.46,
"r_y1": 613.29,
"r_x2": 247.46,
"r_y2": 604.39,
"r_x3": 50.11,
"r_y3": 604.39,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 616.34,
"r": 261.79,
"b": 625.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.643,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 625.25,
"r_x1": 261.79,
"r_y1": 625.25,
"r_x2": 261.79,
"r_y2": 616.34,
"r_x3": 50.11,
"r_y3": 616.34,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 644.35,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 653.31,
"r_x1": 124.72,
"r_y1": 653.31,
"r_x2": 124.72,
"r_y2": 644.35,
"r_x3": 62.07,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.38,
"r_x1": 242.93,
"r_y1": 653.38,
"r_x2": 242.93,
"r_y2": 644.47,
"r_x3": 128.2,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.55,
"r_y0": 653.15,
"r_x1": 286.36,
"r_y1": 653.15,
"r_x2": 286.36,
"r_y2": 644.56,
"r_x3": 245.55,
"r_y3": 644.56,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.1,
"r_x1": 84.97,
"r_y1": 665.1,
"r_x2": 84.97,
"r_y2": 656.51,
"r_x3": 50.11,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.52,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 89.52,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 227.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 322.14,
"r_y1": 84.11,
"r_x2": 322.14,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.45,
"r_y0": 83.89,
"r_x1": 404.57,
"r_y1": 83.89,
"r_x2": 404.57,
"r_y2": 75.3,
"r_x3": 325.45,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.11,
"r_x1": 545.11,
"r_y1": 84.11,
"r_x2": 545.11,
"r_y2": 75.21,
"r_x3": 408.1,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 470.23,
"r_y1": 108.02,
"r_x2": 470.23,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.53,
"r_y0": 108.02,
"r_x1": 545.12,
"r_y1": 108.02,
"r_x2": 545.12,
"r_y2": 99.12,
"r_x3": 477.53,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 119.98,
"r_x1": 545.12,
"r_y1": 119.98,
"r_x2": 545.12,
"r_y2": 111.07,
"r_x3": 308.86,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 131.93,
"r_x1": 545.12,
"r_y1": 131.93,
"r_x2": 545.12,
"r_y2": 123.03,
"r_x3": 308.86,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 143.89,
"r_x1": 502.02,
"r_y1": 143.89,
"r_x2": 502.02,
"r_y2": 134.98,
"r_x3": 308.86,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.47,
"r_y0": 143.66,
"r_x1": 545.11,
"r_y1": 143.66,
"r_x2": 545.11,
"r_y2": 135.07,
"r_x3": 504.47,
"r_y3": 135.07,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 155.62,
"r_x1": 343.16,
"r_y1": 155.62,
"r_x2": 343.16,
"r_y2": 147.03,
"r_x3": 308.86,
"r_y3": 147.03,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.37,
"r_y0": 155.85,
"r_x1": 545.11,
"r_y1": 155.85,
"r_x2": 545.11,
"r_y2": 146.94,
"r_x3": 346.37,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 167.8,
"r_x1": 446.16,
"r_y1": 167.8,
"r_x2": 446.16,
"r_y2": 158.89,
"r_x3": 308.86,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.29,
"r_y0": 167.57,
"r_x1": 525.04,
"r_y1": 167.57,
"r_x2": 525.04,
"r_y2": 158.98,
"r_x3": 448.29,
"r_y3": 158.98,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.11,
"r_y1": 167.8,
"r_x2": 545.11,
"r_y2": 158.89,
"r_x3": 527.4,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 179.76,
"r_x1": 545.12,
"r_y1": 179.76,
"r_x2": 545.12,
"r_y2": 170.85,
"r_x3": 308.86,
"r_y3": 170.85,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 191.71,
"r_x1": 432.87,
"r_y1": 191.71,
"r_x2": 432.87,
"r_y2": 182.8,
"r_x3": 308.86,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.39,
"r_y0": 191.48,
"r_x1": 510.93,
"r_y1": 191.48,
"r_x2": 510.93,
"r_y2": 182.89,
"r_x3": 436.39,
"r_y3": 182.89,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.68,
"r_y0": 191.71,
"r_x1": 545.11,
"r_y1": 191.71,
"r_x2": 545.11,
"r_y2": 182.8,
"r_x3": 514.68,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 203.67,
"r_x1": 431.17,
"r_y1": 203.67,
"r_x2": 431.17,
"r_y2": 194.76,
"r_x3": 308.86,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.68,
"r_y0": 203.44,
"r_x1": 514.18,
"r_y1": 203.44,
"r_x2": 514.18,
"r_y2": 194.85,
"r_x3": 434.68,
"r_y3": 194.85,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.18,
"r_y0": 203.67,
"r_x1": 545.11,
"r_y1": 203.67,
"r_x2": 545.11,
"r_y2": 194.76,
"r_x3": 514.18,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 215.39,
"r_x1": 382.36,
"r_y1": 215.39,
"r_x2": 382.36,
"r_y2": 206.81,
"r_x3": 308.86,
"r_y3": 206.81,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.08,
"r_y0": 215.62,
"r_x1": 545.11,
"r_y1": 215.62,
"r_x2": 545.11,
"r_y2": 206.72,
"r_x3": 385.08,
"r_y3": 206.72,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 227.58,
"r_x1": 501.7,
"r_y1": 227.58,
"r_x2": 501.7,
"r_y2": 218.67,
"r_x3": 308.86,
"r_y3": 218.67,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 308.41,
"t": 247.88,
"r": 533.64,
"b": 303.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.969,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 12,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 316.45,
"r": 545.12,
"b": 337.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 325.36,
"r_x1": 341.5,
"r_y1": 325.36,
"r_x2": 341.5,
"r_y2": 316.45,
"r_x3": 308.86,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.36,
"r_x1": 545.12,
"r_y1": 325.36,
"r_x2": 545.12,
"r_y2": 316.45,
"r_x3": 348.6,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.31,
"r_x1": 474.98,
"r_y1": 337.31,
"r_x2": 474.98,
"r_y2": 328.4,
"r_x3": 308.86,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 367.68,
"r": 545.12,
"b": 520.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 376.64,
"r_x1": 378.95,
"r_y1": 376.64,
"r_x2": 378.95,
"r_y2": 367.68,
"r_x3": 320.82,
"r_y3": 367.68,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.08,
"r_y0": 376.71,
"r_x1": 545.12,
"r_y1": 376.71,
"r_x2": 545.12,
"r_y2": 367.8,
"r_x3": 387.08,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.66,
"r_x1": 487.19,
"r_y1": 388.66,
"r_x2": 487.19,
"r_y2": 379.75,
"r_x3": 308.86,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.97,
"r_y0": 388.66,
"r_x1": 545.12,
"r_y1": 388.66,
"r_x2": 545.12,
"r_y2": 379.75,
"r_x3": 493.97,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.62,
"r_x1": 545.12,
"r_y1": 400.62,
"r_x2": 545.12,
"r_y2": 391.71,
"r_x3": 308.86,
"r_y3": 391.71,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.57,
"r_x1": 545.12,
"r_y1": 412.57,
"r_x2": 545.12,
"r_y2": 403.67,
"r_x3": 308.86,
"r_y3": 403.67,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.53,
"r_x1": 314.08,
"r_y1": 424.53,
"r_x2": 314.08,
"r_y2": 415.62,
"r_x3": 308.86,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.69,
"r_y0": 424.53,
"r_x1": 545.12,
"r_y1": 424.53,
"r_x2": 545.12,
"r_y2": 415.62,
"r_x3": 316.69,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.48,
"r_x1": 545.12,
"r_y1": 436.48,
"r_x2": 545.12,
"r_y2": 427.58,
"r_x3": 308.86,
"r_y3": 427.58,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.44,
"r_x1": 545.12,
"r_y1": 448.44,
"r_x2": 545.12,
"r_y2": 439.53,
"r_x3": 308.86,
"r_y3": 439.53,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 460.39,
"r_x1": 350.24,
"r_y1": 460.39,
"r_x2": 350.24,
"r_y2": 451.49,
"r_x3": 308.86,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.18,
"r_y0": 460.32,
"r_x1": 374.59,
"r_y1": 460.32,
"r_x2": 374.59,
"r_y2": 451.37,
"r_x3": 352.18,
"r_y3": 451.37,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.53,
"r_y0": 460.39,
"r_x1": 545.11,
"r_y1": 460.39,
"r_x2": 545.11,
"r_y2": 451.49,
"r_x3": 376.53,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 472.35,
"r_x1": 545.12,
"r_y1": 472.35,
"r_x2": 545.12,
"r_y2": 463.44,
"r_x3": 308.86,
"r_y3": 463.44,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.3,
"r_x1": 545.12,
"r_y1": 484.3,
"r_x2": 545.12,
"r_y2": 475.4,
"r_x3": 308.86,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.26,
"r_x1": 545.12,
"r_y1": 496.26,
"r_x2": 545.12,
"r_y2": 487.35,
"r_x3": 308.86,
"r_y3": 487.35,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.21,
"r_x1": 545.12,
"r_y1": 508.21,
"r_x2": 545.12,
"r_y2": 499.31,
"r_x3": 308.86,
"r_y3": 499.31,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.17,
"r_x1": 405.7,
"r_y1": 520.17,
"r_x2": 405.7,
"r_y2": 511.26,
"r_x3": 308.86,
"r_y3": 511.26,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "table",
"bbox": {
"l": 332.97,
"t": 540.28,
"r": 520.94,
"b": 643.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.21,
"r": 485.08,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 656.86,
"r": 545.12,
"b": 689.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.77,
"r_x1": 341.74,
"r_y1": 665.77,
"r_x2": 341.74,
"r_y2": 656.86,
"r_x3": 308.86,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.56,
"r_y0": 665.77,
"r_x1": 545.12,
"r_y1": 665.77,
"r_x2": 545.12,
"r_y2": 656.86,
"r_x3": 349.56,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.72,
"r_x1": 545.12,
"r_y1": 677.72,
"r_x2": 545.12,
"r_y2": 668.82,
"r_x3": 308.86,
"r_y3": 668.82,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.68,
"r_x1": 435.04,
"r_y1": 689.68,
"r_x2": 435.04,
"r_y2": 680.77,
"r_x3": 308.86,
"r_y3": 680.77,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.879,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"0": {
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.37,
"t": 409.14,
"r": 283.04,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.989,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.36,
"t": 426.67,
"r": 247.74,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"8": {
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.41,
"t": 247.88,
"r": 533.64,
"b": 303.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.969,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"5": {
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 332.97,
"t": 540.28,
"r": 520.94,
"b": 643.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.21,
"r": 485.08,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 10,
"page_no": 6,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 74.4,
"r": 167.9,
"b": 84.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.25,
"r_x1": 63.7,
"r_y1": 84.25,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.11,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.77,
"r_y0": 84.25,
"r_x1": 167.9,
"r_y1": 84.25,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.77,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.3. Datasets and Metrics"
},
{
"label": "text",
"id": 1,
"page_no": 6,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 93.35,
"r": 286.37,
"b": 138.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 102.26,
"r_x1": 286.36,
"r_y1": 102.26,
"r_x2": 286.36,
"r_y2": 93.35,
"r_x3": 62.07,
"r_y3": 93.35,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 114.21,
"r_x1": 286.37,
"r_y1": 114.21,
"r_x2": 286.37,
"r_y2": 105.31,
"r_x3": 50.11,
"r_y3": 105.31,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 126.17,
"r_x1": 286.37,
"r_y1": 126.17,
"r_x2": 286.37,
"r_y2": 117.26,
"r_x3": 50.11,
"r_y3": 117.26,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 138.12,
"r_x1": 136.72,
"r_y1": 138.12,
"r_x2": 136.72,
"r_y2": 129.22,
"r_x3": 50.11,
"r_y3": 129.22,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"
},
{
"label": "formula",
"id": 13,
"page_no": 6,
"cluster": {
"id": 13,
"label": "formula",
"bbox": {
"l": 86.22,
"t": 150.32,
"r": 286.36,
"b": 172.74,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.22,
"r_y0": 165.9,
"r_x1": 118.88,
"r_y1": 165.9,
"r_x2": 118.88,
"r_y2": 157.06,
"r_x3": 86.22,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.87,
"r_y0": 165.9,
"r_x1": 143.27,
"r_y1": 165.9,
"r_x2": 143.27,
"r_y2": 157.06,
"r_x3": 118.87,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.77,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.06,
"r_x3": 143.77,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.12,
"r_y0": 165.9,
"r_x1": 175.87,
"r_y1": 165.9,
"r_x2": 175.87,
"r_y2": 156.5,
"r_x3": 168.12,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.28,
"r_y0": 159.16,
"r_x1": 221.96,
"r_y1": 159.16,
"r_x2": 221.96,
"r_y2": 150.32,
"r_x3": 179.28,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.95,
"r_y0": 159.16,
"r_x1": 246.35,
"r_y1": 159.16,
"r_x2": 246.35,
"r_y2": 150.32,
"r_x3": 221.95,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.84,
"r_y0": 159.16,
"r_x1": 250.72,
"r_y1": 159.16,
"r_x2": 250.72,
"r_y2": 150.32,
"r_x3": 246.84,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.21,
"r_y0": 172.74,
"r_x1": 206.29,
"r_y1": 172.74,
"r_x2": 206.29,
"r_y2": 163.89,
"r_x3": 182.21,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.29,
"r_y0": 172.74,
"r_x1": 209.06,
"r_y1": 172.74,
"r_x2": 209.06,
"r_y2": 163.33,
"r_x3": 206.29,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.06,
"r_y0": 172.74,
"r_x1": 219.2,
"r_y1": 172.74,
"r_x2": 219.2,
"r_y2": 163.89,
"r_x3": 209.06,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.74,
"r_x1": 222.46,
"r_y1": 172.74,
"r_x2": 222.46,
"r_y2": 163.33,
"r_x3": 219.7,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.12,
"r_y0": 172.74,
"r_x1": 226.89,
"r_y1": 172.74,
"r_x2": 226.89,
"r_y2": 163.89,
"r_x3": 224.12,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.55,
"r_y0": 172.74,
"r_x1": 231.32,
"r_y1": 172.74,
"r_x2": 231.32,
"r_y2": 163.33,
"r_x3": 228.55,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.32,
"r_y0": 172.74,
"r_x1": 240.65,
"r_y1": 172.74,
"r_x2": 240.65,
"r_y2": 163.89,
"r_x3": 231.32,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.14,
"r_y0": 172.74,
"r_x1": 243.91,
"r_y1": 172.74,
"r_x2": 243.91,
"r_y2": 163.33,
"r_x3": 241.14,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.91,
"r_y0": 172.74,
"r_x1": 247.79,
"r_y1": 172.74,
"r_x2": 247.79,
"r_y2": 163.89,
"r_x3": 243.91,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 166.12,
"r_x1": 286.36,
"r_y1": 166.12,
"r_x2": 286.36,
"r_y2": 157.22,
"r_x3": 274.75,
"r_y3": 157.22,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)"
},
{
"label": "text",
"id": 6,
"page_no": 6,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 181.0,
"r": 286.36,
"b": 213.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 190.07,
"r_x1": 86.41,
"r_y1": 190.07,
"r_x2": 86.41,
"r_y2": 181.16,
"r_x3": 62.07,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.58,
"r_y0": 189.85,
"r_x1": 98.72,
"r_y1": 189.85,
"r_x2": 98.72,
"r_y2": 181.0,
"r_x3": 88.58,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.07,
"r_x1": 115.78,
"r_y1": 190.07,
"r_x2": 115.78,
"r_y2": 181.16,
"r_x3": 101.4,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.96,
"r_y0": 189.85,
"r_x1": 127.29,
"r_y1": 189.85,
"r_x2": 127.29,
"r_y2": 181.0,
"r_x3": 117.96,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.96,
"r_y0": 190.07,
"r_x1": 286.36,
"r_y1": 190.07,
"r_x2": 286.36,
"r_y2": 181.16,
"r_x3": 129.96,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 202.02,
"r_x1": 252.78,
"r_y1": 202.02,
"r_x2": 252.78,
"r_y2": 193.12,
"r_x3": 50.11,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.18,
"r_y0": 201.8,
"r_x1": 257.95,
"r_y1": 201.8,
"r_x2": 257.95,
"r_y2": 192.4,
"r_x3": 255.18,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.95,
"r_y0": 201.8,
"r_x1": 263.77,
"r_y1": 201.8,
"r_x2": 263.77,
"r_y2": 192.96,
"r_x3": 257.95,
"r_y3": 192.96,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.15,
"r_y0": 201.8,
"r_x1": 267.92,
"r_y1": 201.8,
"r_x2": 267.92,
"r_y2": 192.4,
"r_x3": 265.15,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.32,
"r_y0": 202.02,
"r_x1": 286.36,
"r_y1": 202.02,
"r_x2": 286.36,
"r_y2": 193.12,
"r_x3": 270.32,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 213.98,
"r_x1": 172.13,
"r_y1": 213.98,
"r_x2": 172.13,
"r_y2": 205.07,
"r_x3": 50.11,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.62,
"r_y0": 213.76,
"r_x1": 180.45,
"r_y1": 213.76,
"r_x2": 180.45,
"r_y2": 204.91,
"r_x3": 174.62,
"r_y3": 204.91,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.83,
"r_y0": 213.98,
"r_x1": 184.32,
"r_y1": 213.98,
"r_x2": 184.32,
"r_y2": 205.07,
"r_x3": 181.83,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."
},
{
"label": "section_header",
"id": 9,
"page_no": 6,
"cluster": {
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 224.82,
"r": 170.45,
"b": 234.67,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 234.67,
"r_x1": 64.55,
"r_y1": 234.67,
"r_x2": 64.55,
"r_y2": 224.82,
"r_x3": 50.11,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.18,
"r_y0": 234.67,
"r_x1": 170.45,
"r_y1": 234.67,
"r_x2": 170.45,
"r_y2": 224.82,
"r_x3": 74.18,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.4. Quantitative Analysis"
},
{
"label": "text",
"id": 2,
"page_no": 6,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.65,
"r": 286.37,
"b": 396.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.61,
"r_x1": 105.32,
"r_y1": 252.61,
"r_x2": 105.32,
"r_y2": 243.65,
"r_x3": 62.07,
"r_y3": 243.65,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.13,
"r_y0": 252.68,
"r_x1": 184.68,
"r_y1": 252.68,
"r_x2": 184.68,
"r_y2": 243.77,
"r_x3": 112.13,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.48,
"r_y0": 252.68,
"r_x1": 286.36,
"r_y1": 252.68,
"r_x2": 286.36,
"r_y2": 243.77,
"r_x3": 191.48,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.63,
"r_x1": 286.37,
"r_y1": 264.63,
"r_x2": 286.37,
"r_y2": 255.72,
"r_x3": 50.11,
"r_y3": 255.72,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.59,
"r_x1": 286.37,
"r_y1": 276.59,
"r_x2": 286.37,
"r_y2": 267.68,
"r_x3": 50.11,
"r_y3": 267.68,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.54,
"r_x1": 286.37,
"r_y1": 288.54,
"r_x2": 286.37,
"r_y2": 279.63,
"r_x3": 50.11,
"r_y3": 279.63,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.5,
"r_x1": 286.37,
"r_y1": 300.5,
"r_x2": 286.37,
"r_y2": 291.59,
"r_x3": 50.11,
"r_y3": 291.59,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.45,
"r_x1": 286.37,
"r_y1": 312.45,
"r_x2": 286.37,
"r_y2": 303.55,
"r_x3": 50.11,
"r_y3": 303.55,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.41,
"r_x1": 286.37,
"r_y1": 324.41,
"r_x2": 286.37,
"r_y2": 315.5,
"r_x3": 50.11,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.36,
"r_x1": 286.37,
"r_y1": 336.36,
"r_x2": 286.37,
"r_y2": 327.46,
"r_x3": 50.11,
"r_y3": 327.46,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.32,
"r_x1": 286.37,
"r_y1": 348.32,
"r_x2": 286.37,
"r_y2": 339.41,
"r_x3": 50.11,
"r_y3": 339.41,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.27,
"r_x1": 286.37,
"r_y1": 360.27,
"r_x2": 286.37,
"r_y2": 351.37,
"r_x3": 50.11,
"r_y3": 351.37,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.23,
"r_x1": 286.37,
"r_y1": 372.23,
"r_x2": 286.37,
"r_y2": 363.32,
"r_x3": 50.11,
"r_y3": 363.32,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.18,
"r_x1": 286.37,
"r_y1": 384.18,
"r_x2": 286.37,
"r_y2": 375.28,
"r_x3": 50.11,
"r_y3": 375.28,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.14,
"r_x1": 170.01,
"r_y1": 396.14,
"r_x2": 170.01,
"r_y2": 387.23,
"r_x3": 50.11,
"r_y3": 387.23,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."
},
{
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.37,
"t": 409.14,
"r": 283.04,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.989,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.36,
"t": 426.67,
"r": 247.74,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "text",
"id": 15,
"page_no": 6,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 50.11,
"t": 592.43,
"r": 286.37,
"b": 613.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.721,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 601.34,
"r_x1": 286.37,
"r_y1": 601.34,
"r_x2": 286.37,
"r_y2": 592.43,
"r_x3": 50.11,
"r_y3": 592.43,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 613.29,
"r_x1": 247.46,
"r_y1": 613.29,
"r_x2": 247.46,
"r_y2": 604.39,
"r_x3": 50.11,
"r_y3": 604.39,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."
},
{
"label": "text",
"id": 16,
"page_no": 6,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 616.34,
"r": 261.79,
"b": 625.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.643,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 625.25,
"r_x1": 261.79,
"r_y1": 625.25,
"r_x2": 261.79,
"r_y2": 616.34,
"r_x3": 50.11,
"r_y3": 616.34,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "FT: Model was trained on PubTabNet then finetuned."
},
{
"label": "text",
"id": 3,
"page_no": 6,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 644.35,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 653.31,
"r_x1": 124.72,
"r_y1": 653.31,
"r_x2": 124.72,
"r_y2": 644.35,
"r_x3": 62.07,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.38,
"r_x1": 242.93,
"r_y1": 653.38,
"r_x2": 242.93,
"r_y2": 644.47,
"r_x3": 128.2,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.55,
"r_y0": 653.15,
"r_x1": 286.36,
"r_y1": 653.15,
"r_x2": 286.36,
"r_y2": 644.56,
"r_x3": 245.55,
"r_y3": 644.56,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.1,
"r_x1": 84.97,
"r_y1": 665.1,
"r_x2": 84.97,
"r_y2": 656.51,
"r_x3": 50.11,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.52,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 89.52,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"
},
{
"label": "text",
"id": 7,
"page_no": 6,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 227.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 322.14,
"r_y1": 84.11,
"r_x2": 322.14,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.45,
"r_y0": 83.89,
"r_x1": 404.57,
"r_y1": 83.89,
"r_x2": 404.57,
"r_y2": 75.3,
"r_x3": 325.45,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.11,
"r_x1": 545.11,
"r_y1": 84.11,
"r_x2": 545.11,
"r_y2": 75.21,
"r_x3": 408.1,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 470.23,
"r_y1": 108.02,
"r_x2": 470.23,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.53,
"r_y0": 108.02,
"r_x1": 545.12,
"r_y1": 108.02,
"r_x2": 545.12,
"r_y2": 99.12,
"r_x3": 477.53,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 119.98,
"r_x1": 545.12,
"r_y1": 119.98,
"r_x2": 545.12,
"r_y2": 111.07,
"r_x3": 308.86,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 131.93,
"r_x1": 545.12,
"r_y1": 131.93,
"r_x2": 545.12,
"r_y2": 123.03,
"r_x3": 308.86,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 143.89,
"r_x1": 502.02,
"r_y1": 143.89,
"r_x2": 502.02,
"r_y2": 134.98,
"r_x3": 308.86,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.47,
"r_y0": 143.66,
"r_x1": 545.11,
"r_y1": 143.66,
"r_x2": 545.11,
"r_y2": 135.07,
"r_x3": 504.47,
"r_y3": 135.07,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 155.62,
"r_x1": 343.16,
"r_y1": 155.62,
"r_x2": 343.16,
"r_y2": 147.03,
"r_x3": 308.86,
"r_y3": 147.03,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.37,
"r_y0": 155.85,
"r_x1": 545.11,
"r_y1": 155.85,
"r_x2": 545.11,
"r_y2": 146.94,
"r_x3": 346.37,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 167.8,
"r_x1": 446.16,
"r_y1": 167.8,
"r_x2": 446.16,
"r_y2": 158.89,
"r_x3": 308.86,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.29,
"r_y0": 167.57,
"r_x1": 525.04,
"r_y1": 167.57,
"r_x2": 525.04,
"r_y2": 158.98,
"r_x3": 448.29,
"r_y3": 158.98,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.11,
"r_y1": 167.8,
"r_x2": 545.11,
"r_y2": 158.89,
"r_x3": 527.4,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 179.76,
"r_x1": 545.12,
"r_y1": 179.76,
"r_x2": 545.12,
"r_y2": 170.85,
"r_x3": 308.86,
"r_y3": 170.85,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 191.71,
"r_x1": 432.87,
"r_y1": 191.71,
"r_x2": 432.87,
"r_y2": 182.8,
"r_x3": 308.86,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.39,
"r_y0": 191.48,
"r_x1": 510.93,
"r_y1": 191.48,
"r_x2": 510.93,
"r_y2": 182.89,
"r_x3": 436.39,
"r_y3": 182.89,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.68,
"r_y0": 191.71,
"r_x1": 545.11,
"r_y1": 191.71,
"r_x2": 545.11,
"r_y2": 182.8,
"r_x3": 514.68,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 203.67,
"r_x1": 431.17,
"r_y1": 203.67,
"r_x2": 431.17,
"r_y2": 194.76,
"r_x3": 308.86,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.68,
"r_y0": 203.44,
"r_x1": 514.18,
"r_y1": 203.44,
"r_x2": 514.18,
"r_y2": 194.85,
"r_x3": 434.68,
"r_y3": 194.85,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.18,
"r_y0": 203.67,
"r_x1": 545.11,
"r_y1": 203.67,
"r_x2": 545.11,
"r_y2": 194.76,
"r_x3": 514.18,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 215.39,
"r_x1": 382.36,
"r_y1": 215.39,
"r_x2": 382.36,
"r_y2": 206.81,
"r_x3": 308.86,
"r_y3": 206.81,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.08,
"r_y0": 215.62,
"r_x1": 545.11,
"r_y1": 215.62,
"r_x2": 545.11,
"r_y2": 206.72,
"r_x3": 385.08,
"r_y3": 206.72,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 227.58,
"r_x1": 501.7,
"r_y1": 227.58,
"r_x2": 501.7,
"r_y2": 218.67,
"r_x3": 308.86,
"r_y3": 218.67,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."
},
{
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.41,
"t": 247.88,
"r": 533.64,
"b": 303.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.969,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 12,
"page_no": 6,
"cluster": {
"id": 12,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 316.45,
"r": 545.12,
"b": 337.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 325.36,
"r_x1": 341.5,
"r_y1": 325.36,
"r_x2": 341.5,
"r_y2": 316.45,
"r_x3": 308.86,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.36,
"r_x1": 545.12,
"r_y1": 325.36,
"r_x2": 545.12,
"r_y2": 316.45,
"r_x3": 348.6,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.31,
"r_x1": 474.98,
"r_y1": 337.31,
"r_x2": 474.98,
"r_y2": 328.4,
"r_x3": 308.86,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."
},
{
"label": "text",
"id": 4,
"page_no": 6,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 367.68,
"r": 545.12,
"b": 520.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 376.64,
"r_x1": 378.95,
"r_y1": 376.64,
"r_x2": 378.95,
"r_y2": 367.68,
"r_x3": 320.82,
"r_y3": 367.68,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.08,
"r_y0": 376.71,
"r_x1": 545.12,
"r_y1": 376.71,
"r_x2": 545.12,
"r_y2": 367.8,
"r_x3": 387.08,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.66,
"r_x1": 487.19,
"r_y1": 388.66,
"r_x2": 487.19,
"r_y2": 379.75,
"r_x3": 308.86,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.97,
"r_y0": 388.66,
"r_x1": 545.12,
"r_y1": 388.66,
"r_x2": 545.12,
"r_y2": 379.75,
"r_x3": 493.97,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.62,
"r_x1": 545.12,
"r_y1": 400.62,
"r_x2": 545.12,
"r_y2": 391.71,
"r_x3": 308.86,
"r_y3": 391.71,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.57,
"r_x1": 545.12,
"r_y1": 412.57,
"r_x2": 545.12,
"r_y2": 403.67,
"r_x3": 308.86,
"r_y3": 403.67,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.53,
"r_x1": 314.08,
"r_y1": 424.53,
"r_x2": 314.08,
"r_y2": 415.62,
"r_x3": 308.86,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.69,
"r_y0": 424.53,
"r_x1": 545.12,
"r_y1": 424.53,
"r_x2": 545.12,
"r_y2": 415.62,
"r_x3": 316.69,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.48,
"r_x1": 545.12,
"r_y1": 436.48,
"r_x2": 545.12,
"r_y2": 427.58,
"r_x3": 308.86,
"r_y3": 427.58,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.44,
"r_x1": 545.12,
"r_y1": 448.44,
"r_x2": 545.12,
"r_y2": 439.53,
"r_x3": 308.86,
"r_y3": 439.53,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 460.39,
"r_x1": 350.24,
"r_y1": 460.39,
"r_x2": 350.24,
"r_y2": 451.49,
"r_x3": 308.86,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.18,
"r_y0": 460.32,
"r_x1": 374.59,
"r_y1": 460.32,
"r_x2": 374.59,
"r_y2": 451.37,
"r_x3": 352.18,
"r_y3": 451.37,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.53,
"r_y0": 460.39,
"r_x1": 545.11,
"r_y1": 460.39,
"r_x2": 545.11,
"r_y2": 451.49,
"r_x3": 376.53,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 472.35,
"r_x1": 545.12,
"r_y1": 472.35,
"r_x2": 545.12,
"r_y2": 463.44,
"r_x3": 308.86,
"r_y3": 463.44,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.3,
"r_x1": 545.12,
"r_y1": 484.3,
"r_x2": 545.12,
"r_y2": 475.4,
"r_x3": 308.86,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.26,
"r_x1": 545.12,
"r_y1": 496.26,
"r_x2": 545.12,
"r_y2": 487.35,
"r_x3": 308.86,
"r_y3": 487.35,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.21,
"r_x1": 545.12,
"r_y1": 508.21,
"r_x2": 545.12,
"r_y2": 499.31,
"r_x3": 308.86,
"r_y3": 499.31,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.17,
"r_x1": 405.7,
"r_y1": 520.17,
"r_x2": 405.7,
"r_y2": 511.26,
"r_x3": 308.86,
"r_y3": 511.26,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."
},
{
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 332.97,
"t": 540.28,
"r": 520.94,
"b": 643.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.21,
"r": 485.08,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 11,
"page_no": 6,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 656.86,
"r": 545.12,
"b": 689.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.77,
"r_x1": 341.74,
"r_y1": 665.77,
"r_x2": 341.74,
"r_y2": 656.86,
"r_x3": 308.86,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.56,
"r_y0": 665.77,
"r_x1": 545.12,
"r_y1": 665.77,
"r_x2": 545.12,
"r_y2": 656.86,
"r_x3": 349.56,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.72,
"r_x1": 545.12,
"r_y1": 677.72,
"r_x2": 545.12,
"r_y2": 668.82,
"r_x3": 308.86,
"r_y3": 668.82,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.68,
"r_x1": 435.04,
"r_y1": 689.68,
"r_x2": 435.04,
"r_y2": 680.77,
"r_x3": 308.86,
"r_y3": 680.77,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."
},
{
"label": "page_footer",
"id": 14,
"page_no": 6,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.879,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7"
}
],
"body": [
{
"label": "section_header",
"id": 10,
"page_no": 6,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 74.4,
"r": 167.9,
"b": 84.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.25,
"r_x1": 63.7,
"r_y1": 84.25,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.11,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.77,
"r_y0": 84.25,
"r_x1": 167.9,
"r_y1": 84.25,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.77,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.3. Datasets and Metrics"
},
{
"label": "text",
"id": 1,
"page_no": 6,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 93.35,
"r": 286.37,
"b": 138.12,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 102.26,
"r_x1": 286.36,
"r_y1": 102.26,
"r_x2": 286.36,
"r_y2": 93.35,
"r_x3": 62.07,
"r_y3": 93.35,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 114.21,
"r_x1": 286.37,
"r_y1": 114.21,
"r_x2": 286.37,
"r_y2": 105.31,
"r_x3": 50.11,
"r_y3": 105.31,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 126.17,
"r_x1": 286.37,
"r_y1": 126.17,
"r_x2": 286.37,
"r_y2": 117.26,
"r_x3": 50.11,
"r_y3": 117.26,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 138.12,
"r_x1": 136.72,
"r_y1": 138.12,
"r_x2": 136.72,
"r_y2": 129.22,
"r_x3": 50.11,
"r_y3": 129.22,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"
},
{
"label": "formula",
"id": 13,
"page_no": 6,
"cluster": {
"id": 13,
"label": "formula",
"bbox": {
"l": 86.22,
"t": 150.32,
"r": 286.36,
"b": 172.74,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.22,
"r_y0": 165.9,
"r_x1": 118.88,
"r_y1": 165.9,
"r_x2": 118.88,
"r_y2": 157.06,
"r_x3": 86.22,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.87,
"r_y0": 165.9,
"r_x1": 143.27,
"r_y1": 165.9,
"r_x2": 143.27,
"r_y2": 157.06,
"r_x3": 118.87,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.77,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.06,
"r_x3": 143.77,
"r_y3": 157.06,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.12,
"r_y0": 165.9,
"r_x1": 175.87,
"r_y1": 165.9,
"r_x2": 175.87,
"r_y2": 156.5,
"r_x3": 168.12,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.28,
"r_y0": 159.16,
"r_x1": 221.96,
"r_y1": 159.16,
"r_x2": 221.96,
"r_y2": 150.32,
"r_x3": 179.28,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.95,
"r_y0": 159.16,
"r_x1": 246.35,
"r_y1": 159.16,
"r_x2": 246.35,
"r_y2": 150.32,
"r_x3": 221.95,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.84,
"r_y0": 159.16,
"r_x1": 250.72,
"r_y1": 159.16,
"r_x2": 250.72,
"r_y2": 150.32,
"r_x3": 246.84,
"r_y3": 150.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.21,
"r_y0": 172.74,
"r_x1": 206.29,
"r_y1": 172.74,
"r_x2": 206.29,
"r_y2": 163.89,
"r_x3": 182.21,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.29,
"r_y0": 172.74,
"r_x1": 209.06,
"r_y1": 172.74,
"r_x2": 209.06,
"r_y2": 163.33,
"r_x3": 206.29,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.06,
"r_y0": 172.74,
"r_x1": 219.2,
"r_y1": 172.74,
"r_x2": 219.2,
"r_y2": 163.89,
"r_x3": 209.06,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.74,
"r_x1": 222.46,
"r_y1": 172.74,
"r_x2": 222.46,
"r_y2": 163.33,
"r_x3": 219.7,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.12,
"r_y0": 172.74,
"r_x1": 226.89,
"r_y1": 172.74,
"r_x2": 226.89,
"r_y2": 163.89,
"r_x3": 224.12,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.55,
"r_y0": 172.74,
"r_x1": 231.32,
"r_y1": 172.74,
"r_x2": 231.32,
"r_y2": 163.33,
"r_x3": 228.55,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.32,
"r_y0": 172.74,
"r_x1": 240.65,
"r_y1": 172.74,
"r_x2": 240.65,
"r_y2": 163.89,
"r_x3": 231.32,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.14,
"r_y0": 172.74,
"r_x1": 243.91,
"r_y1": 172.74,
"r_x2": 243.91,
"r_y2": 163.33,
"r_x3": 241.14,
"r_y3": 163.33,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.91,
"r_y0": 172.74,
"r_x1": 247.79,
"r_y1": 172.74,
"r_x2": 247.79,
"r_y2": 163.89,
"r_x3": 243.91,
"r_y3": 163.89,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 166.12,
"r_x1": 286.36,
"r_y1": 166.12,
"r_x2": 286.36,
"r_y2": 157.22,
"r_x3": 274.75,
"r_y3": 157.22,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)"
},
{
"label": "text",
"id": 6,
"page_no": 6,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.11,
"t": 181.0,
"r": 286.36,
"b": 213.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.974,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 190.07,
"r_x1": 86.41,
"r_y1": 190.07,
"r_x2": 86.41,
"r_y2": 181.16,
"r_x3": 62.07,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.58,
"r_y0": 189.85,
"r_x1": 98.72,
"r_y1": 189.85,
"r_x2": 98.72,
"r_y2": 181.0,
"r_x3": 88.58,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.07,
"r_x1": 115.78,
"r_y1": 190.07,
"r_x2": 115.78,
"r_y2": 181.16,
"r_x3": 101.4,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.96,
"r_y0": 189.85,
"r_x1": 127.29,
"r_y1": 189.85,
"r_x2": 127.29,
"r_y2": 181.0,
"r_x3": 117.96,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.96,
"r_y0": 190.07,
"r_x1": 286.36,
"r_y1": 190.07,
"r_x2": 286.36,
"r_y2": 181.16,
"r_x3": 129.96,
"r_y3": 181.16,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 202.02,
"r_x1": 252.78,
"r_y1": 202.02,
"r_x2": 252.78,
"r_y2": 193.12,
"r_x3": 50.11,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.18,
"r_y0": 201.8,
"r_x1": 257.95,
"r_y1": 201.8,
"r_x2": 257.95,
"r_y2": 192.4,
"r_x3": 255.18,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.95,
"r_y0": 201.8,
"r_x1": 263.77,
"r_y1": 201.8,
"r_x2": 263.77,
"r_y2": 192.96,
"r_x3": 257.95,
"r_y3": 192.96,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.15,
"r_y0": 201.8,
"r_x1": 267.92,
"r_y1": 201.8,
"r_x2": 267.92,
"r_y2": 192.4,
"r_x3": 265.15,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.32,
"r_y0": 202.02,
"r_x1": 286.36,
"r_y1": 202.02,
"r_x2": 286.36,
"r_y2": 193.12,
"r_x3": 270.32,
"r_y3": 193.12,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 213.98,
"r_x1": 172.13,
"r_y1": 213.98,
"r_x2": 172.13,
"r_y2": 205.07,
"r_x3": 50.11,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.62,
"r_y0": 213.76,
"r_x1": 180.45,
"r_y1": 213.76,
"r_x2": 180.45,
"r_y2": 204.91,
"r_x3": 174.62,
"r_y3": 204.91,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.83,
"r_y0": 213.98,
"r_x1": 184.32,
"r_y1": 213.98,
"r_x2": 184.32,
"r_y2": 205.07,
"r_x3": 181.83,
"r_y3": 205.07,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."
},
{
"label": "section_header",
"id": 9,
"page_no": 6,
"cluster": {
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 224.82,
"r": 170.45,
"b": 234.67,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 234.67,
"r_x1": 64.55,
"r_y1": 234.67,
"r_x2": 64.55,
"r_y2": 224.82,
"r_x3": 50.11,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.18,
"r_y0": 234.67,
"r_x1": 170.45,
"r_y1": 234.67,
"r_x2": 170.45,
"r_y2": 224.82,
"r_x3": 74.18,
"r_y3": 224.82,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.4. Quantitative Analysis"
},
{
"label": "text",
"id": 2,
"page_no": 6,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 243.65,
"r": 286.37,
"b": 396.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 252.61,
"r_x1": 105.32,
"r_y1": 252.61,
"r_x2": 105.32,
"r_y2": 243.65,
"r_x3": 62.07,
"r_y3": 243.65,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.13,
"r_y0": 252.68,
"r_x1": 184.68,
"r_y1": 252.68,
"r_x2": 184.68,
"r_y2": 243.77,
"r_x3": 112.13,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.48,
"r_y0": 252.68,
"r_x1": 286.36,
"r_y1": 252.68,
"r_x2": 286.36,
"r_y2": 243.77,
"r_x3": 191.48,
"r_y3": 243.77,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 264.63,
"r_x1": 286.37,
"r_y1": 264.63,
"r_x2": 286.37,
"r_y2": 255.72,
"r_x3": 50.11,
"r_y3": 255.72,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 276.59,
"r_x1": 286.37,
"r_y1": 276.59,
"r_x2": 286.37,
"r_y2": 267.68,
"r_x3": 50.11,
"r_y3": 267.68,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 288.54,
"r_x1": 286.37,
"r_y1": 288.54,
"r_x2": 286.37,
"r_y2": 279.63,
"r_x3": 50.11,
"r_y3": 279.63,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.5,
"r_x1": 286.37,
"r_y1": 300.5,
"r_x2": 286.37,
"r_y2": 291.59,
"r_x3": 50.11,
"r_y3": 291.59,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.45,
"r_x1": 286.37,
"r_y1": 312.45,
"r_x2": 286.37,
"r_y2": 303.55,
"r_x3": 50.11,
"r_y3": 303.55,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 324.41,
"r_x1": 286.37,
"r_y1": 324.41,
"r_x2": 286.37,
"r_y2": 315.5,
"r_x3": 50.11,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 336.36,
"r_x1": 286.37,
"r_y1": 336.36,
"r_x2": 286.37,
"r_y2": 327.46,
"r_x3": 50.11,
"r_y3": 327.46,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 348.32,
"r_x1": 286.37,
"r_y1": 348.32,
"r_x2": 286.37,
"r_y2": 339.41,
"r_x3": 50.11,
"r_y3": 339.41,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 360.27,
"r_x1": 286.37,
"r_y1": 360.27,
"r_x2": 286.37,
"r_y2": 351.37,
"r_x3": 50.11,
"r_y3": 351.37,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 372.23,
"r_x1": 286.37,
"r_y1": 372.23,
"r_x2": 286.37,
"r_y2": 363.32,
"r_x3": 50.11,
"r_y3": 363.32,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 384.18,
"r_x1": 286.37,
"r_y1": 384.18,
"r_x2": 286.37,
"r_y2": 375.28,
"r_x3": 50.11,
"r_y3": 375.28,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 396.14,
"r_x1": 170.01,
"r_y1": 396.14,
"r_x2": 170.01,
"r_y2": 387.23,
"r_x3": 50.11,
"r_y3": 387.23,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."
},
{
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.37,
"t": 409.14,
"r": 283.04,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.989,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.84,
"r_y0": 429.6,
"r_x1": 104.86,
"r_y1": 429.6,
"r_x2": 104.86,
"r_y2": 420.69,
"r_x3": 78.84,
"r_y3": 420.69,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.62,
"r_x1": 236.11,
"r_y1": 423.62,
"r_x2": 236.11,
"r_y2": 414.71,
"r_x3": 211.2,
"r_y3": 414.71,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.34,
"r_y0": 435.57,
"r_x1": 159.22,
"r_y1": 435.57,
"r_x2": 159.22,
"r_y2": 426.67,
"r_x3": 129.34,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.17,
"r_y0": 435.57,
"r_x1": 199.4,
"r_y1": 435.57,
"r_x2": 199.4,
"r_y2": 426.67,
"r_x3": 171.17,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.36,
"t": 426.67,
"r": 247.74,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.36,
"r_y0": 435.57,
"r_x1": 247.74,
"r_y1": 435.57,
"r_x2": 247.74,
"r_y2": 426.67,
"r_x3": 211.36,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.54,
"r_y0": 435.57,
"r_x1": 277.27,
"r_y1": 435.57,
"r_x2": 277.27,
"r_y2": 426.67,
"r_x3": 264.54,
"r_y3": 426.67,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 452.53,
"r_x1": 102.09,
"r_y1": 452.53,
"r_x2": 102.09,
"r_y2": 443.62,
"r_x3": 81.61,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 452.53,
"r_x1": 153.69,
"r_y1": 452.53,
"r_x2": 153.69,
"r_y2": 443.62,
"r_x3": 134.87,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 452.53,
"r_x1": 194.0,
"r_y1": 452.53,
"r_x2": 194.0,
"r_y2": 443.62,
"r_x3": 176.57,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 452.53,
"r_x1": 238.26,
"r_y1": 452.53,
"r_x2": 238.26,
"r_y2": 443.62,
"r_x3": 220.83,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 452.53,
"r_x1": 279.62,
"r_y1": 452.53,
"r_x2": 279.62,
"r_y2": 443.62,
"r_x3": 262.18,
"r_y3": 443.62,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 464.49,
"r_x1": 101.53,
"r_y1": 464.49,
"r_x2": 101.53,
"r_y2": 455.58,
"r_x3": 82.17,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 464.49,
"r_x1": 153.69,
"r_y1": 464.49,
"r_x2": 153.69,
"r_y2": 455.58,
"r_x3": 134.87,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 464.49,
"r_x1": 186.94,
"r_y1": 464.49,
"r_x2": 186.94,
"r_y2": 455.58,
"r_x3": 183.62,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 464.49,
"r_x1": 231.21,
"r_y1": 464.49,
"r_x2": 231.21,
"r_y2": 455.58,
"r_x3": 227.89,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.49,
"r_x1": 282.11,
"r_y1": 464.49,
"r_x2": 282.11,
"r_y2": 455.58,
"r_x3": 259.7,
"r_y3": 455.58,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 477.04,
"r_x1": 117.38,
"r_y1": 477.04,
"r_x2": 117.38,
"r_y2": 468.13,
"r_x3": 66.32,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 477.04,
"r_x1": 153.69,
"r_y1": 477.04,
"r_x2": 153.69,
"r_y2": 468.13,
"r_x3": 134.87,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 477.04,
"r_x1": 194.01,
"r_y1": 477.04,
"r_x2": 194.01,
"r_y2": 468.13,
"r_x3": 176.57,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 477.04,
"r_x1": 238.27,
"r_y1": 477.04,
"r_x2": 238.27,
"r_y2": 468.13,
"r_x3": 220.83,
"r_y3": 468.13,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 476.97,
"r_x1": 282.11,
"r_y1": 476.97,
"r_x2": 282.11,
"r_y2": 468.01,
"r_x3": 259.7,
"r_y3": 468.01,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 492.23,
"r_x1": 102.09,
"r_y1": 492.23,
"r_x2": 102.09,
"r_y2": 483.33,
"r_x3": 81.61,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 492.23,
"r_x1": 153.69,
"r_y1": 492.23,
"r_x2": 153.69,
"r_y2": 483.33,
"r_x3": 134.87,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 492.23,
"r_x1": 194.0,
"r_y1": 492.23,
"r_x2": 194.0,
"r_y2": 483.33,
"r_x3": 176.57,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.34,
"r_y0": 492.23,
"r_x1": 240.75,
"r_y1": 492.23,
"r_x2": 240.75,
"r_y2": 483.33,
"r_x3": 218.34,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 492.23,
"r_x1": 279.62,
"r_y1": 492.23,
"r_x2": 279.62,
"r_y2": 483.33,
"r_x3": 262.18,
"r_y3": 483.33,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.17,
"r_y0": 504.19,
"r_x1": 101.53,
"r_y1": 504.19,
"r_x2": 101.53,
"r_y2": 495.28,
"r_x3": 82.17,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 504.19,
"r_x1": 153.69,
"r_y1": 504.19,
"r_x2": 153.69,
"r_y2": 495.28,
"r_x3": 134.87,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.62,
"r_y0": 504.19,
"r_x1": 186.94,
"r_y1": 504.19,
"r_x2": 186.94,
"r_y2": 495.28,
"r_x3": 183.62,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 504.19,
"r_x1": 231.21,
"r_y1": 504.19,
"r_x2": 231.21,
"r_y2": 495.28,
"r_x3": 227.89,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.19,
"r_x1": 282.11,
"r_y1": 504.19,
"r_x2": 282.11,
"r_y2": 495.28,
"r_x3": 259.7,
"r_y3": 495.28,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.79,
"r_y0": 516.14,
"r_x1": 111.91,
"r_y1": 516.14,
"r_x2": 111.91,
"r_y2": 507.24,
"r_x3": 71.79,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.86,
"r_y0": 516.14,
"r_x1": 153.68,
"r_y1": 516.14,
"r_x2": 153.68,
"r_y2": 507.24,
"r_x3": 134.86,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.63,
"r_y0": 516.14,
"r_x1": 186.95,
"r_y1": 516.14,
"r_x2": 186.95,
"r_y2": 507.24,
"r_x3": 183.63,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 516.14,
"r_x1": 231.21,
"r_y1": 516.14,
"r_x2": 231.21,
"r_y2": 507.24,
"r_x3": 227.89,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.69,
"r_y0": 516.14,
"r_x1": 282.11,
"r_y1": 516.14,
"r_x2": 282.11,
"r_y2": 507.24,
"r_x3": 259.69,
"r_y3": 507.24,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 528.1,
"r_x1": 117.38,
"r_y1": 528.1,
"r_x2": 117.38,
"r_y2": 519.19,
"r_x3": 66.32,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 528.1,
"r_x1": 153.69,
"r_y1": 528.1,
"r_x2": 153.69,
"r_y2": 519.19,
"r_x3": 134.87,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 528.1,
"r_x1": 194.01,
"r_y1": 528.1,
"r_x2": 194.01,
"r_y2": 519.19,
"r_x3": 176.57,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 528.1,
"r_x1": 238.27,
"r_y1": 528.1,
"r_x2": 238.27,
"r_y2": 519.19,
"r_x3": 220.83,
"r_y3": 519.19,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 528.03,
"r_x1": 279.62,
"r_y1": 528.03,
"r_x2": 279.62,
"r_y2": 519.07,
"r_x3": 262.19,
"r_y3": 519.07,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.61,
"r_y0": 545.4,
"r_x1": 102.09,
"r_y1": 545.4,
"r_x2": 102.09,
"r_y2": 536.5,
"r_x3": 81.61,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 545.4,
"r_x1": 150.64,
"r_y1": 545.4,
"r_x2": 150.64,
"r_y2": 536.5,
"r_x3": 137.91,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.57,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 545.4,
"r_x1": 231.21,
"r_y1": 545.4,
"r_x2": 231.21,
"r_y2": 536.5,
"r_x3": 227.89,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.18,
"r_y0": 545.4,
"r_x1": 279.62,
"r_y1": 545.4,
"r_x2": 279.62,
"r_y2": 536.5,
"r_x3": 262.18,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 557.36,
"r_x1": 117.38,
"r_y1": 557.36,
"r_x2": 117.38,
"r_y2": 548.45,
"r_x3": 66.32,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.91,
"r_y0": 557.36,
"r_x1": 150.64,
"r_y1": 557.36,
"r_x2": 150.64,
"r_y2": 548.45,
"r_x3": 137.91,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 557.36,
"r_x1": 194.01,
"r_y1": 557.36,
"r_x2": 194.01,
"r_y2": 548.45,
"r_x3": 176.57,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.89,
"r_y0": 557.36,
"r_x1": 231.21,
"r_y1": 557.36,
"r_x2": 231.21,
"r_y2": 548.45,
"r_x3": 227.89,
"r_y3": 548.45,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 557.29,
"r_x1": 279.62,
"r_y1": 557.29,
"r_x2": 279.62,
"r_y2": 548.33,
"r_x3": 262.19,
"r_y3": 548.33,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.32,
"r_y0": 576.91,
"r_x1": 117.38,
"r_y1": 576.91,
"r_x2": 117.38,
"r_y2": 568.0,
"r_x3": 66.32,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.87,
"r_y0": 576.91,
"r_x1": 153.69,
"r_y1": 576.91,
"r_x2": 153.69,
"r_y2": 568.0,
"r_x3": 134.87,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.57,
"r_y0": 576.91,
"r_x1": 194.01,
"r_y1": 576.91,
"r_x2": 194.01,
"r_y2": 568.0,
"r_x3": 176.57,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.83,
"r_y0": 576.91,
"r_x1": 238.27,
"r_y1": 576.91,
"r_x2": 238.27,
"r_y2": 568.0,
"r_x3": 220.83,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.19,
"r_y0": 576.91,
"r_x1": 279.62,
"r_y1": 576.91,
"r_x2": 279.62,
"r_y2": 568.0,
"r_x3": 262.19,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.84,
"t": 420.69,
"r": 104.86,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.71,
"r": 236.11,
"b": 423.62,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.34,
"t": 426.67,
"r": 159.22,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.17,
"t": 426.67,
"r": 199.4,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.54,
"t": 426.67,
"r": 277.27,
"b": 435.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 443.62,
"r": 102.09,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 443.62,
"r": 153.69,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 443.62,
"r": 194.0,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 443.62,
"r": 238.26,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 443.62,
"r": 279.62,
"b": 452.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 455.58,
"r": 101.53,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 455.58,
"r": 153.69,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 455.58,
"r": 186.94,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 455.58,
"r": 231.21,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.58,
"r": 282.11,
"b": 464.49,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 468.13,
"r": 117.38,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 468.13,
"r": 153.69,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 468.13,
"r": 194.01,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 468.13,
"r": 238.27,
"b": 477.04,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.01,
"r": 282.11,
"b": 476.97,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 483.33,
"r": 102.09,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 483.33,
"r": 153.69,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 483.33,
"r": 194.0,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.34,
"t": 483.33,
"r": 240.75,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 483.33,
"r": 279.62,
"b": 492.23,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.17,
"t": 495.28,
"r": 101.53,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 495.28,
"r": 153.69,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.62,
"t": 495.28,
"r": 186.94,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 495.28,
"r": 231.21,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.28,
"r": 282.11,
"b": 504.19,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.79,
"t": 507.24,
"r": 111.91,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.86,
"t": 507.24,
"r": 153.68,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.63,
"t": 507.24,
"r": 186.95,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 507.24,
"r": 231.21,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.69,
"t": 507.24,
"r": 282.11,
"b": 516.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 519.19,
"r": 117.38,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 519.19,
"r": 153.69,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 519.19,
"r": 194.01,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 519.19,
"r": 238.27,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 519.07,
"r": 279.62,
"b": 528.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.61,
"t": 536.5,
"r": 102.09,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 536.5,
"r": 150.64,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 536.5,
"r": 231.21,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.18,
"t": 536.5,
"r": 279.62,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 548.45,
"r": 117.38,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.91,
"t": 548.45,
"r": 150.64,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 548.45,
"r": 194.01,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.89,
"t": 548.45,
"r": 231.21,
"b": 557.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 548.33,
"r": 279.62,
"b": 557.29,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.32,
"t": 568.0,
"r": 117.38,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.87,
"t": 568.0,
"r": 153.69,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.57,
"t": 568.0,
"r": 194.01,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.83,
"t": 568.0,
"r": 238.27,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.19,
"t": 568.0,
"r": 279.62,
"b": 576.91,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "text",
"id": 15,
"page_no": 6,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 50.11,
"t": 592.43,
"r": 286.37,
"b": 613.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.721,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 601.34,
"r_x1": 286.37,
"r_y1": 601.34,
"r_x2": 286.37,
"r_y2": 592.43,
"r_x3": 50.11,
"r_y3": 592.43,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 613.29,
"r_x1": 247.46,
"r_y1": 613.29,
"r_x2": 247.46,
"r_y2": 604.39,
"r_x3": 50.11,
"r_y3": 604.39,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."
},
{
"label": "text",
"id": 16,
"page_no": 6,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.11,
"t": 616.34,
"r": 261.79,
"b": 625.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.643,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 625.25,
"r_x1": 261.79,
"r_y1": 625.25,
"r_x2": 261.79,
"r_y2": 616.34,
"r_x3": 50.11,
"r_y3": 616.34,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "FT: Model was trained on PubTabNet then finetuned."
},
{
"label": "text",
"id": 3,
"page_no": 6,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 644.35,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 653.31,
"r_x1": 124.72,
"r_y1": 653.31,
"r_x2": 124.72,
"r_y2": 644.35,
"r_x3": 62.07,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.38,
"r_x1": 242.93,
"r_y1": 653.38,
"r_x2": 242.93,
"r_y2": 644.47,
"r_x3": 128.2,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.55,
"r_y0": 653.15,
"r_x1": 286.36,
"r_y1": 653.15,
"r_x2": 286.36,
"r_y2": 644.56,
"r_x3": 245.55,
"r_y3": 644.56,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.1,
"r_x1": 84.97,
"r_y1": 665.1,
"r_x2": 84.97,
"r_y2": 656.51,
"r_x3": 50.11,
"r_y3": 656.51,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.52,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 89.52,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 286.37,
"r_y1": 713.15,
"r_x2": 286.37,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"
},
{
"label": "text",
"id": 7,
"page_no": 6,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.86,
"t": 75.21,
"r": 545.12,
"b": 227.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 84.11,
"r_x1": 322.14,
"r_y1": 84.11,
"r_x2": 322.14,
"r_y2": 75.21,
"r_x3": 308.86,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.45,
"r_y0": 83.89,
"r_x1": 404.57,
"r_y1": 83.89,
"r_x2": 404.57,
"r_y2": 75.3,
"r_x3": 325.45,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.11,
"r_x1": 545.11,
"r_y1": 84.11,
"r_x2": 545.11,
"r_y2": 75.21,
"r_x3": 408.1,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 96.07,
"r_x1": 545.12,
"r_y1": 96.07,
"r_x2": 545.12,
"r_y2": 87.16,
"r_x3": 308.86,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 108.02,
"r_x1": 470.23,
"r_y1": 108.02,
"r_x2": 470.23,
"r_y2": 99.12,
"r_x3": 308.86,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.53,
"r_y0": 108.02,
"r_x1": 545.12,
"r_y1": 108.02,
"r_x2": 545.12,
"r_y2": 99.12,
"r_x3": 477.53,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 119.98,
"r_x1": 545.12,
"r_y1": 119.98,
"r_x2": 545.12,
"r_y2": 111.07,
"r_x3": 308.86,
"r_y3": 111.07,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 131.93,
"r_x1": 545.12,
"r_y1": 131.93,
"r_x2": 545.12,
"r_y2": 123.03,
"r_x3": 308.86,
"r_y3": 123.03,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 143.89,
"r_x1": 502.02,
"r_y1": 143.89,
"r_x2": 502.02,
"r_y2": 134.98,
"r_x3": 308.86,
"r_y3": 134.98,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.47,
"r_y0": 143.66,
"r_x1": 545.11,
"r_y1": 143.66,
"r_x2": 545.11,
"r_y2": 135.07,
"r_x3": 504.47,
"r_y3": 135.07,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 155.62,
"r_x1": 343.16,
"r_y1": 155.62,
"r_x2": 343.16,
"r_y2": 147.03,
"r_x3": 308.86,
"r_y3": 147.03,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.37,
"r_y0": 155.85,
"r_x1": 545.11,
"r_y1": 155.85,
"r_x2": 545.11,
"r_y2": 146.94,
"r_x3": 346.37,
"r_y3": 146.94,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 167.8,
"r_x1": 446.16,
"r_y1": 167.8,
"r_x2": 446.16,
"r_y2": 158.89,
"r_x3": 308.86,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.29,
"r_y0": 167.57,
"r_x1": 525.04,
"r_y1": 167.57,
"r_x2": 525.04,
"r_y2": 158.98,
"r_x3": 448.29,
"r_y3": 158.98,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.11,
"r_y1": 167.8,
"r_x2": 545.11,
"r_y2": 158.89,
"r_x3": 527.4,
"r_y3": 158.89,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 179.76,
"r_x1": 545.12,
"r_y1": 179.76,
"r_x2": 545.12,
"r_y2": 170.85,
"r_x3": 308.86,
"r_y3": 170.85,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 191.71,
"r_x1": 432.87,
"r_y1": 191.71,
"r_x2": 432.87,
"r_y2": 182.8,
"r_x3": 308.86,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.39,
"r_y0": 191.48,
"r_x1": 510.93,
"r_y1": 191.48,
"r_x2": 510.93,
"r_y2": 182.89,
"r_x3": 436.39,
"r_y3": 182.89,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.68,
"r_y0": 191.71,
"r_x1": 545.11,
"r_y1": 191.71,
"r_x2": 545.11,
"r_y2": 182.8,
"r_x3": 514.68,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 203.67,
"r_x1": 431.17,
"r_y1": 203.67,
"r_x2": 431.17,
"r_y2": 194.76,
"r_x3": 308.86,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.68,
"r_y0": 203.44,
"r_x1": 514.18,
"r_y1": 203.44,
"r_x2": 514.18,
"r_y2": 194.85,
"r_x3": 434.68,
"r_y3": 194.85,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.18,
"r_y0": 203.67,
"r_x1": 545.11,
"r_y1": 203.67,
"r_x2": 545.11,
"r_y2": 194.76,
"r_x3": 514.18,
"r_y3": 194.76,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 215.39,
"r_x1": 382.36,
"r_y1": 215.39,
"r_x2": 382.36,
"r_y2": 206.81,
"r_x3": 308.86,
"r_y3": 206.81,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.08,
"r_y0": 215.62,
"r_x1": 545.11,
"r_y1": 215.62,
"r_x2": 545.11,
"r_y2": 206.72,
"r_x3": 385.08,
"r_y3": 206.72,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 227.58,
"r_x1": 501.7,
"r_y1": 227.58,
"r_x2": 501.7,
"r_y2": 218.67,
"r_x3": 308.86,
"r_y3": 218.67,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."
},
{
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.41,
"t": 247.88,
"r": 533.64,
"b": 303.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.969,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.32,
"r_y0": 262.57,
"r_x1": 365.34,
"r_y1": 262.57,
"r_x2": 365.34,
"r_y2": 253.66,
"r_x3": 339.32,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.04,
"r_y0": 262.57,
"r_x1": 430.92,
"r_y1": 262.57,
"r_x2": 430.92,
"r_y2": 253.66,
"r_x3": 401.04,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.57,
"r_x1": 474.59,
"r_y1": 262.57,
"r_x2": 474.59,
"r_y2": 253.66,
"r_x3": 454.1,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.54,
"r_y0": 262.57,
"r_x1": 527.23,
"r_y1": 262.57,
"r_x2": 527.23,
"r_y2": 253.66,
"r_x3": 486.54,
"r_y3": 253.66,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.66,
"r_y0": 279.53,
"r_x1": 377.0,
"r_y1": 279.53,
"r_x2": 377.0,
"r_y2": 270.62,
"r_x3": 327.66,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.53,
"r_x1": 438.28,
"r_y1": 279.53,
"r_x2": 438.28,
"r_y2": 270.62,
"r_x3": 393.7,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.64,
"r_y0": 279.53,
"r_x1": 473.07,
"r_y1": 279.53,
"r_x2": 473.07,
"r_y2": 270.62,
"r_x3": 455.64,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 279.53,
"r_x1": 515.6,
"r_y1": 279.53,
"r_x2": 515.6,
"r_y2": 270.62,
"r_x3": 498.17,
"r_y3": 270.62,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.48,
"r_x1": 377.86,
"r_y1": 291.48,
"r_x2": 377.86,
"r_y2": 282.58,
"r_x3": 326.8,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.69,
"r_y0": 291.48,
"r_x1": 438.28,
"r_y1": 291.48,
"r_x2": 438.28,
"r_y2": 282.58,
"r_x3": 393.69,
"r_y3": 282.58,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 291.41,
"r_x1": 473.07,
"r_y1": 291.41,
"r_x2": 473.07,
"r_y2": 282.46,
"r_x3": 455.63,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.17,
"r_y0": 291.41,
"r_x1": 515.61,
"r_y1": 291.41,
"r_x2": 515.61,
"r_y2": 282.46,
"r_x3": 498.17,
"r_y3": 282.46,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.44,
"r_x1": 377.86,
"r_y1": 303.44,
"r_x2": 377.86,
"r_y2": 294.53,
"r_x3": 326.8,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.82,
"r_y0": 303.44,
"r_x1": 442.15,
"r_y1": 303.44,
"r_x2": 442.15,
"r_y2": 294.53,
"r_x3": 389.82,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.63,
"r_y0": 303.44,
"r_x1": 473.07,
"r_y1": 303.44,
"r_x2": 473.07,
"r_y2": 294.53,
"r_x3": 455.63,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.23,
"r_y0": 303.44,
"r_x1": 508.54,
"r_y1": 303.44,
"r_x2": 508.54,
"r_y2": 294.53,
"r_x3": 505.23,
"r_y3": 294.53,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.32,
"t": 253.66,
"r": 365.34,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.04,
"t": 253.66,
"r": 430.92,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.66,
"r": 474.59,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.54,
"t": 253.66,
"r": 527.23,
"b": 262.57,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.66,
"t": 270.62,
"r": 377.0,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.62,
"r": 438.28,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.64,
"t": 270.62,
"r": 473.07,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 270.62,
"r": 515.6,
"b": 279.53,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.58,
"r": 377.86,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.69,
"t": 282.58,
"r": 438.28,
"b": 291.48,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 282.46,
"r": 473.07,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.17,
"t": 282.46,
"r": 515.61,
"b": 291.41,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.53,
"r": 377.86,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.82,
"t": 294.53,
"r": 442.15,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.63,
"t": 294.53,
"r": 473.07,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.23,
"t": 294.53,
"r": 508.54,
"b": 303.44,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 12,
"page_no": 6,
"cluster": {
"id": 12,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 316.45,
"r": 545.12,
"b": 337.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 325.36,
"r_x1": 341.5,
"r_y1": 325.36,
"r_x2": 341.5,
"r_y2": 316.45,
"r_x3": 308.86,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.36,
"r_x1": 545.12,
"r_y1": 325.36,
"r_x2": 545.12,
"r_y2": 316.45,
"r_x3": 348.6,
"r_y3": 316.45,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.31,
"r_x1": 474.98,
"r_y1": 337.31,
"r_x2": 474.98,
"r_y2": 328.4,
"r_x3": 308.86,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."
},
{
"label": "text",
"id": 4,
"page_no": 6,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.86,
"t": 367.68,
"r": 545.12,
"b": 520.17,
"coord_origin": "TOPLEFT"
},
"confidence": 0.984,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 376.64,
"r_x1": 378.95,
"r_y1": 376.64,
"r_x2": 378.95,
"r_y2": 367.68,
"r_x3": 320.82,
"r_y3": 367.68,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.08,
"r_y0": 376.71,
"r_x1": 545.12,
"r_y1": 376.71,
"r_x2": 545.12,
"r_y2": 367.8,
"r_x3": 387.08,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 388.66,
"r_x1": 487.19,
"r_y1": 388.66,
"r_x2": 487.19,
"r_y2": 379.75,
"r_x3": 308.86,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.97,
"r_y0": 388.66,
"r_x1": 545.12,
"r_y1": 388.66,
"r_x2": 545.12,
"r_y2": 379.75,
"r_x3": 493.97,
"r_y3": 379.75,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.62,
"r_x1": 545.12,
"r_y1": 400.62,
"r_x2": 545.12,
"r_y2": 391.71,
"r_x3": 308.86,
"r_y3": 391.71,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.57,
"r_x1": 545.12,
"r_y1": 412.57,
"r_x2": 545.12,
"r_y2": 403.67,
"r_x3": 308.86,
"r_y3": 403.67,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.53,
"r_x1": 314.08,
"r_y1": 424.53,
"r_x2": 314.08,
"r_y2": 415.62,
"r_x3": 308.86,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.69,
"r_y0": 424.53,
"r_x1": 545.12,
"r_y1": 424.53,
"r_x2": 545.12,
"r_y2": 415.62,
"r_x3": 316.69,
"r_y3": 415.62,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.48,
"r_x1": 545.12,
"r_y1": 436.48,
"r_x2": 545.12,
"r_y2": 427.58,
"r_x3": 308.86,
"r_y3": 427.58,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.44,
"r_x1": 545.12,
"r_y1": 448.44,
"r_x2": 545.12,
"r_y2": 439.53,
"r_x3": 308.86,
"r_y3": 439.53,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 460.39,
"r_x1": 350.24,
"r_y1": 460.39,
"r_x2": 350.24,
"r_y2": 451.49,
"r_x3": 308.86,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.18,
"r_y0": 460.32,
"r_x1": 374.59,
"r_y1": 460.32,
"r_x2": 374.59,
"r_y2": 451.37,
"r_x3": 352.18,
"r_y3": 451.37,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.53,
"r_y0": 460.39,
"r_x1": 545.11,
"r_y1": 460.39,
"r_x2": 545.11,
"r_y2": 451.49,
"r_x3": 376.53,
"r_y3": 451.49,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 472.35,
"r_x1": 545.12,
"r_y1": 472.35,
"r_x2": 545.12,
"r_y2": 463.44,
"r_x3": 308.86,
"r_y3": 463.44,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.3,
"r_x1": 545.12,
"r_y1": 484.3,
"r_x2": 545.12,
"r_y2": 475.4,
"r_x3": 308.86,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.26,
"r_x1": 545.12,
"r_y1": 496.26,
"r_x2": 545.12,
"r_y2": 487.35,
"r_x3": 308.86,
"r_y3": 487.35,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.21,
"r_x1": 545.12,
"r_y1": 508.21,
"r_x2": 545.12,
"r_y2": 499.31,
"r_x3": 308.86,
"r_y3": 499.31,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.17,
"r_x1": 405.7,
"r_y1": 520.17,
"r_x2": 405.7,
"r_y2": 511.26,
"r_x3": 308.86,
"r_y3": 511.26,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."
},
{
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 332.97,
"t": 540.28,
"r": 520.94,
"b": 643.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.01,
"r_y0": 561.14,
"r_x1": 384.02,
"r_y1": 561.14,
"r_x2": 384.02,
"r_y2": 552.23,
"r_x3": 358.01,
"r_y3": 552.23,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.03,
"r_y0": 555.16,
"r_x1": 473.94,
"r_y1": 555.16,
"r_x2": 473.94,
"r_y2": 546.26,
"r_x3": 449.03,
"r_y3": 546.26,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.51,
"r_y0": 567.12,
"r_x1": 436.74,
"r_y1": 567.12,
"r_x2": 436.74,
"r_y2": 558.21,
"r_x3": 408.51,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.21,
"r": 485.08,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.12,
"r_x1": 485.08,
"r_y1": 567.12,
"r_x2": 485.08,
"r_y2": 558.21,
"r_x3": 448.7,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.38,
"r_y0": 567.12,
"r_x1": 512.12,
"r_y1": 567.12,
"r_x2": 512.12,
"r_y2": 558.21,
"r_x3": 499.38,
"r_y3": 558.21,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.68,
"r_y0": 584.07,
"r_x1": 384.35,
"r_y1": 584.07,
"r_x2": 384.35,
"r_y2": 575.17,
"r_x3": 357.68,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.07,
"r_x1": 431.34,
"r_y1": 584.07,
"r_x2": 431.34,
"r_y2": 575.17,
"r_x3": 413.9,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.16,
"r_y0": 584.07,
"r_x1": 475.6,
"r_y1": 584.07,
"r_x2": 475.6,
"r_y2": 575.17,
"r_x3": 458.16,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 584.07,
"r_x1": 514.46,
"r_y1": 584.07,
"r_x2": 514.46,
"r_y2": 575.17,
"r_x3": 497.03,
"r_y3": 575.17,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.72,
"r_y0": 596.03,
"r_x1": 391.31,
"r_y1": 596.03,
"r_x2": 391.31,
"r_y2": 587.12,
"r_x3": 350.72,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 596.03,
"r_x1": 431.34,
"r_y1": 596.03,
"r_x2": 431.34,
"r_y2": 587.12,
"r_x3": 413.91,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 596.03,
"r_x1": 475.6,
"r_y1": 596.03,
"r_x2": 475.6,
"r_y2": 587.12,
"r_x3": 458.17,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 596.03,
"r_x1": 514.47,
"r_y1": 596.03,
"r_x2": 514.47,
"r_y2": 587.12,
"r_x3": 497.03,
"r_y3": 587.12,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.14,
"r_y0": 607.98,
"r_x1": 387.9,
"r_y1": 607.98,
"r_x2": 387.9,
"r_y2": 599.08,
"r_x3": 354.14,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 607.98,
"r_x1": 431.34,
"r_y1": 607.98,
"r_x2": 431.34,
"r_y2": 599.08,
"r_x3": 413.9,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 607.98,
"r_x1": 475.6,
"r_y1": 607.98,
"r_x2": 475.6,
"r_y2": 599.08,
"r_x3": 458.17,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 607.98,
"r_x1": 514.46,
"r_y1": 607.98,
"r_x2": 514.46,
"r_y2": 599.08,
"r_x3": 497.03,
"r_y3": 599.08,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.56,
"r_y0": 619.94,
"r_x1": 395.48,
"r_y1": 619.94,
"r_x2": 395.48,
"r_y2": 611.03,
"r_x3": 346.56,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 619.94,
"r_x1": 431.34,
"r_y1": 619.94,
"r_x2": 431.34,
"r_y2": 611.03,
"r_x3": 413.91,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 619.94,
"r_x1": 475.6,
"r_y1": 619.94,
"r_x2": 475.6,
"r_y2": 611.03,
"r_x3": 458.17,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 619.94,
"r_x1": 514.47,
"r_y1": 619.94,
"r_x2": 514.47,
"r_y2": 611.03,
"r_x3": 497.03,
"r_y3": 611.03,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.78,
"r_y0": 631.89,
"r_x1": 381.25,
"r_y1": 631.89,
"r_x2": 381.25,
"r_y2": 622.99,
"r_x3": 360.78,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.89,
"r_x1": 431.34,
"r_y1": 631.89,
"r_x2": 431.34,
"r_y2": 622.99,
"r_x3": 413.9,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 631.89,
"r_x1": 475.6,
"r_y1": 631.89,
"r_x2": 475.6,
"r_y2": 622.99,
"r_x3": 458.17,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 631.89,
"r_x1": 514.46,
"r_y1": 631.89,
"r_x2": 514.46,
"r_y2": 622.99,
"r_x3": 497.03,
"r_y3": 622.99,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.48,
"r_y0": 643.85,
"r_x1": 396.55,
"r_y1": 643.85,
"r_x2": 396.55,
"r_y2": 634.94,
"r_x3": 345.48,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.91,
"r_y0": 643.85,
"r_x1": 431.34,
"r_y1": 643.85,
"r_x2": 431.34,
"r_y2": 634.94,
"r_x3": 413.91,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.17,
"r_y0": 643.85,
"r_x1": 475.6,
"r_y1": 643.85,
"r_x2": 475.6,
"r_y2": 634.94,
"r_x3": 458.17,
"r_y3": 634.94,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.03,
"r_y0": 643.78,
"r_x1": 514.47,
"r_y1": 643.78,
"r_x2": 514.47,
"r_y2": 634.82,
"r_x3": 497.03,
"r_y3": 634.82,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.01,
"t": 552.23,
"r": 384.02,
"b": 561.14,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.03,
"t": 546.26,
"r": 473.94,
"b": 555.16,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.51,
"t": 558.21,
"r": 436.74,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.38,
"t": 558.21,
"r": 512.12,
"b": 567.12,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.68,
"t": 575.17,
"r": 384.35,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.17,
"r": 431.34,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.16,
"t": 575.17,
"r": 475.6,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 575.17,
"r": 514.46,
"b": 584.07,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.72,
"t": 587.12,
"r": 391.31,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 587.12,
"r": 431.34,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 587.12,
"r": 475.6,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 587.12,
"r": 514.47,
"b": 596.03,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.14,
"t": 599.08,
"r": 387.9,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.08,
"r": 431.34,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 599.08,
"r": 475.6,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 599.08,
"r": 514.46,
"b": 607.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.56,
"t": 611.03,
"r": 395.48,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 611.03,
"r": 431.34,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 611.03,
"r": 475.6,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 611.03,
"r": 514.47,
"b": 619.94,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.78,
"t": 622.99,
"r": 381.25,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 622.99,
"r": 431.34,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 622.99,
"r": 475.6,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 622.99,
"r": 514.46,
"b": 631.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.48,
"t": 634.94,
"r": 396.55,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.91,
"t": 634.94,
"r": 431.34,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.17,
"t": 634.94,
"r": 475.6,
"b": 643.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.03,
"t": 634.82,
"r": 514.47,
"b": 643.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 11,
"page_no": 6,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 656.86,
"r": 545.12,
"b": 689.68,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 665.77,
"r_x1": 341.74,
"r_y1": 665.77,
"r_x2": 341.74,
"r_y2": 656.86,
"r_x3": 308.86,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.56,
"r_y0": 665.77,
"r_x1": 545.12,
"r_y1": 665.77,
"r_x2": 545.12,
"r_y2": 656.86,
"r_x3": 349.56,
"r_y3": 656.86,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 677.72,
"r_x1": 545.12,
"r_y1": 677.72,
"r_x2": 545.12,
"r_y2": 668.82,
"r_x3": 308.86,
"r_y3": 668.82,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 689.68,
"r_x1": 435.04,
"r_y1": 689.68,
"r_x2": 435.04,
"r_y2": 680.77,
"r_x3": 308.86,
"r_y3": 680.77,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 6,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.879,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7"
}
]
}
},
{
"page_no": 7,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 216.11,
"r_x1": 62.22,
"r_y1": 216.11,
"r_x2": 62.22,
"r_y2": 208.23,
"r_x3": 53.81,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.42,
"r_y0": 216.11,
"r_x1": 385.93,
"r_y1": 216.11,
"r_x2": 385.93,
"r_y2": 208.23,
"r_x3": 66.42,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 102.15,
"r_x1": 284.35,
"r_y1": 102.15,
"r_x2": 284.35,
"r_y2": 94.28,
"r_x3": 53.81,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.83,
"r_y0": 102.15,
"r_x1": 431.09,
"r_y1": 102.15,
"r_x2": 431.09,
"r_y2": 94.28,
"r_x3": 304.83,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.29,
"r_y0": 86.56,
"r_x1": 61.55,
"r_y1": 86.56,
"r_x2": 61.55,
"r_y2": 78.69,
"r_x3": 53.29,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.68,
"r_y0": 86.56,
"r_x1": 499.56,
"r_y1": 86.56,
"r_x2": 499.56,
"r_y2": 78.69,
"r_x3": 65.68,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.43,
"r_y0": 298.6,
"r_x1": 549.42,
"r_y1": 298.6,
"r_x2": 549.42,
"r_y2": 292.3,
"r_x3": 380.43,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 329.78,
"r_x1": 86.86,
"r_y1": 329.78,
"r_x2": 86.86,
"r_y2": 320.88,
"r_x3": 50.11,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.92,
"r_y0": 329.78,
"r_x1": 545.11,
"r_y1": 329.78,
"r_x2": 545.11,
"r_y2": 320.88,
"r_x3": 93.92,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 341.74,
"r_x1": 545.11,
"r_y1": 341.74,
"r_x2": 545.11,
"r_y2": 332.83,
"r_x3": 50.11,
"r_y3": 332.83,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 353.69,
"r_x1": 545.11,
"r_y1": 353.69,
"r_x2": 545.11,
"r_y2": 344.79,
"r_x3": 50.11,
"r_y3": 344.79,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.65,
"r_x1": 139.8,
"r_y1": 365.65,
"r_x2": 139.8,
"r_y2": 356.74,
"r_x3": 50.11,
"r_y3": 356.74,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.63,
"r_x1": 532.63,
"r_y1": 467.63,
"r_x2": 532.63,
"r_y2": 458.73,
"r_x3": 62.6,
"r_y3": 458.73,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.25,
"r_x1": 64.45,
"r_y1": 501.25,
"r_x2": 64.45,
"r_y2": 491.4,
"r_x3": 50.11,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.01,
"r_y0": 501.25,
"r_x1": 163.76,
"r_y1": 501.25,
"r_x2": 163.76,
"r_y2": 491.4,
"r_x3": 74.01,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 545.78,
"r_x1": 286.36,
"r_y1": 545.78,
"r_x2": 286.36,
"r_y2": 536.87,
"r_x3": 62.07,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 557.73,
"r_x1": 211.16,
"r_y1": 557.73,
"r_x2": 211.16,
"r_y2": 548.83,
"r_x3": 50.11,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.51,
"r_x1": 259.17,
"r_y1": 557.51,
"r_x2": 259.17,
"r_y2": 548.92,
"r_x3": 215.1,
"r_y3": 548.92,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.12,
"r_y0": 557.73,
"r_x1": 286.36,
"r_y1": 557.73,
"r_x2": 286.36,
"r_y2": 548.83,
"r_x3": 263.12,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 569.69,
"r_x1": 286.37,
"r_y1": 569.69,
"r_x2": 286.37,
"r_y2": 560.78,
"r_x3": 50.11,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 226.89,
"r_y1": 713.15,
"r_x2": 226.89,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 501.46,
"r_x1": 316.07,
"r_y1": 501.46,
"r_x2": 316.07,
"r_y2": 490.71,
"r_x3": 308.86,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.69,
"r_y0": 501.46,
"r_x1": 460.85,
"r_y1": 501.46,
"r_x2": 460.85,
"r_y2": 490.71,
"r_x3": 325.69,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 521.8,
"r_x1": 545.12,
"r_y1": 521.8,
"r_x2": 545.12,
"r_y2": 512.89,
"r_x3": 320.82,
"r_y3": 512.89,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.75,
"r_x1": 545.12,
"r_y1": 533.75,
"r_x2": 545.12,
"r_y2": 524.85,
"r_x3": 308.86,
"r_y3": 524.85,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.71,
"r_x1": 545.12,
"r_y1": 545.71,
"r_x2": 545.12,
"r_y2": 536.8,
"r_x3": 308.86,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.66,
"r_x1": 545.12,
"r_y1": 557.66,
"r_x2": 545.12,
"r_y2": 548.76,
"r_x3": 308.86,
"r_y3": 548.76,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.62,
"r_x1": 545.12,
"r_y1": 569.62,
"r_x2": 545.12,
"r_y2": 560.71,
"r_x3": 308.86,
"r_y3": 560.71,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.57,
"r_x1": 545.12,
"r_y1": 581.57,
"r_x2": 545.12,
"r_y2": 572.67,
"r_x3": 308.86,
"r_y3": 572.67,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.53,
"r_x1": 545.12,
"r_y1": 593.53,
"r_x2": 545.12,
"r_y2": 584.62,
"r_x3": 308.86,
"r_y3": 584.62,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.49,
"r_x1": 400.47,
"r_y1": 605.49,
"r_x2": 400.47,
"r_y2": 596.58,
"r_x3": 308.86,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.38,
"r_y0": 605.49,
"r_x1": 545.12,
"r_y1": 605.49,
"r_x2": 545.12,
"r_y2": 596.58,
"r_x3": 408.38,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.44,
"r_x1": 545.12,
"r_y1": 617.44,
"r_x2": 545.12,
"r_y2": 608.53,
"r_x3": 308.86,
"r_y3": 608.53,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.4,
"r_x1": 545.12,
"r_y1": 629.4,
"r_x2": 545.12,
"r_y2": 620.49,
"r_x3": 308.86,
"r_y3": 620.49,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.35,
"r_x1": 545.12,
"r_y1": 641.35,
"r_x2": 545.12,
"r_y2": 632.44,
"r_x3": 308.86,
"r_y3": 632.44,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.31,
"r_x1": 365.86,
"r_y1": 653.31,
"r_x2": 365.86,
"r_y2": 644.4,
"r_x3": 308.86,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 682.85,
"r_x1": 364.41,
"r_y1": 682.85,
"r_x2": 364.41,
"r_y2": 672.1,
"r_x3": 308.86,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.35,
"r_y0": 701.98,
"r_x1": 323.81,
"r_y1": 701.98,
"r_x2": 323.81,
"r_y2": 693.96,
"r_x3": 313.35,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.05,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 326.05,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 545.11,
"r_y1": 712.94,
"r_x2": 545.11,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 18,
"label": "caption",
"bbox": {
"l": 53.81,
"t": 208.23,
"r": 385.93,
"b": 216.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.599,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 216.11,
"r_x1": 62.22,
"r_y1": 216.11,
"r_x2": 62.22,
"r_y2": 208.23,
"r_x3": 53.81,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.42,
"r_y0": 216.11,
"r_x1": 385.93,
"r_y1": 216.11,
"r_x2": 385.93,
"r_y2": 208.23,
"r_x3": 66.42,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.81,
"t": 94.28,
"r": 284.35,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.465,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 102.15,
"r_x1": 284.35,
"r_y1": 102.15,
"r_x2": 284.35,
"r_y2": 94.28,
"r_x3": 53.81,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.83,
"t": 94.28,
"r": 431.09,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.463,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.83,
"r_y0": 102.15,
"r_x1": 431.09,
"r_y1": 102.15,
"r_x2": 431.09,
"r_y2": 94.28,
"r_x3": 304.83,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.29,
"t": 78.69,
"r": 61.55,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.582,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.29,
"r_y0": 86.56,
"r_x1": 61.55,
"r_y1": 86.56,
"r_x2": 61.55,
"r_y2": 78.69,
"r_x3": 53.29,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.68,
"t": 78.69,
"r": 499.56,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.541,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.68,
"r_y0": 86.56,
"r_x1": 499.56,
"r_y1": 86.56,
"r_x2": 499.56,
"r_y2": 78.69,
"r_x3": 65.68,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 53.63,
"t": 218.95,
"r": 298.56,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.11,
"t": 229.67,
"r": 201.29,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.59,
"r": 103.03,
"b": 253.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.03,
"t": 249.8,
"r": 128.96,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.05,
"t": 257.07,
"r": 93.22,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.22,
"t": 257.28,
"r": 119.15,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.45,
"t": 257.07,
"r": 129.88,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.18,
"t": 264.3,
"r": 65.34,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.34,
"t": 264.51,
"r": 122.38,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.45,
"t": 264.3,
"r": 129.88,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 101.99,
"t": 271.53,
"r": 109.74,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.74,
"t": 271.74,
"r": 114.93,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.39,
"t": 271.53,
"r": 122.14,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.14,
"t": 271.74,
"r": 127.32,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.69,
"t": 279.22,
"r": 110.17,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 16,
"label": "caption",
"bbox": {
"l": 380.43,
"t": 292.3,
"r": 549.42,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.43,
"r_y0": 298.6,
"r_x1": 549.42,
"r_y1": 298.6,
"r_x2": 549.42,
"r_y2": 292.3,
"r_x3": 380.43,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "table",
"bbox": {
"l": 304.92,
"t": 218.51,
"r": 550.23,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.82,
"t": 227.83,
"r": 507.23,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.75,
"t": 236.75,
"r": 404.65,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.65,
"t": 236.75,
"r": 407.35,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.65,
"t": 244.61,
"r": 364.66,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.75,
"t": 244.91,
"r": 403.76,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 480.98,
"t": 244.91,
"r": 483.55,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.75,
"t": 253.68,
"r": 403.76,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.73,
"t": 261.55,
"r": 403.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.74,
"t": 261.55,
"r": 405.54,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.73,
"t": 270.32,
"r": 403.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.74,
"t": 270.32,
"r": 405.54,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 6,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 320.88,
"r": 545.11,
"b": 365.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.914,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 329.78,
"r_x1": 86.86,
"r_y1": 329.78,
"r_x2": 86.86,
"r_y2": 320.88,
"r_x3": 50.11,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.92,
"r_y0": 329.78,
"r_x1": 545.11,
"r_y1": 329.78,
"r_x2": 545.11,
"r_y2": 320.88,
"r_x3": 93.92,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 341.74,
"r_x1": 545.11,
"r_y1": 341.74,
"r_x2": 545.11,
"r_y2": 332.83,
"r_x3": 50.11,
"r_y3": 332.83,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 353.69,
"r_x1": 545.11,
"r_y1": 353.69,
"r_x2": 545.11,
"r_y2": 344.79,
"r_x3": 50.11,
"r_y3": 344.79,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.65,
"r_x1": 139.8,
"r_y1": 365.65,
"r_x2": 139.8,
"r_y2": 356.74,
"r_x3": 50.11,
"r_y3": 356.74,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "picture",
"bbox": {
"l": 216.77,
"t": 380.49,
"r": 375.78,
"b": 443.35,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.26,
"t": 381.78,
"r": 342.08,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "picture",
"bbox": {
"l": 51.74,
"t": 380.48,
"r": 211.84,
"b": 443.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.831,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.72,
"t": 381.78,
"r": 85.66,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 13,
"label": "picture",
"bbox": {
"l": 383.14,
"t": 381.23,
"r": 542.11,
"b": 442.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.788,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.38,
"t": 400.55,
"r": 443.7,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.33,
"t": 400.55,
"r": 456.65,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.28,
"t": 400.55,
"r": 469.6,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.24,
"t": 400.55,
"r": 482.56,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.19,
"t": 400.55,
"r": 495.51,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.14,
"t": 400.55,
"r": 508.46,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.55,
"r": 521.41,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.28,
"t": 411.04,
"r": 391.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.52,
"t": 411.04,
"r": 404.84,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.48,
"t": 411.04,
"r": 417.8,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.38,
"t": 411.04,
"r": 443.7,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.33,
"t": 411.04,
"r": 456.65,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.28,
"t": 411.04,
"r": 469.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.28,
"t": 421.07,
"r": 391.6,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.52,
"t": 421.07,
"r": 404.84,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.48,
"t": 421.07,
"r": 417.8,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.43,
"t": 421.07,
"r": 430.75,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.38,
"t": 421.07,
"r": 443.7,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.33,
"t": 421.07,
"r": 456.65,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.29,
"t": 421.07,
"r": 469.61,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.24,
"t": 421.07,
"r": 482.56,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.19,
"t": 421.07,
"r": 495.51,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.14,
"t": 421.07,
"r": 508.46,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.07,
"r": 521.42,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.05,
"t": 421.07,
"r": 534.37,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.28,
"t": 432.04,
"r": 391.6,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.52,
"t": 432.04,
"r": 404.84,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.48,
"t": 432.04,
"r": 417.8,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.43,
"t": 432.04,
"r": 430.75,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.38,
"t": 432.04,
"r": 443.7,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.33,
"t": 432.04,
"r": 456.65,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.29,
"t": 432.04,
"r": 469.61,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.24,
"t": 432.04,
"r": 482.56,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.19,
"t": 432.04,
"r": 495.51,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.14,
"t": 432.04,
"r": 508.46,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.04,
"r": 521.42,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.05,
"t": 432.04,
"r": 534.37,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.28,
"t": 389.2,
"r": 388.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.52,
"t": 389.2,
"r": 401.68,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.48,
"t": 389.2,
"r": 414.63,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.43,
"t": 389.2,
"r": 427.59,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.38,
"t": 389.2,
"r": 440.54,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.33,
"t": 389.2,
"r": 453.49,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.28,
"t": 389.2,
"r": 466.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.24,
"t": 389.2,
"r": 479.39,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.19,
"t": 389.2,
"r": 492.35,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.14,
"t": 389.2,
"r": 505.3,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.09,
"t": 389.2,
"r": 521.41,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.04,
"t": 389.2,
"r": 534.13,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.28,
"t": 398.97,
"r": 391.6,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.52,
"t": 398.97,
"r": 404.84,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.48,
"t": 398.97,
"r": 417.8,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.43,
"t": 406.77,
"r": 430.75,
"b": 413.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.87,
"t": 410.99,
"r": 509.19,
"b": 417.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.35,
"t": 381.78,
"r": 430.99,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.73,
"r": 532.63,
"b": 467.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.915,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.63,
"r_x1": 532.63,
"r_y1": 467.63,
"r_x2": 532.63,
"r_y2": 458.73,
"r_x3": 62.6,
"r_y3": 458.73,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 491.4,
"r": 163.76,
"b": 501.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.25,
"r_x1": 64.45,
"r_y1": 501.25,
"r_x2": 64.45,
"r_y2": 491.4,
"r_x3": 50.11,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.01,
"r_y0": 501.25,
"r_x1": 163.76,
"r_y1": 501.25,
"r_x2": 163.76,
"r_y2": 491.4,
"r_x3": 74.01,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 536.87,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 545.78,
"r_x1": 286.36,
"r_y1": 545.78,
"r_x2": 286.36,
"r_y2": 536.87,
"r_x3": 62.07,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 557.73,
"r_x1": 211.16,
"r_y1": 557.73,
"r_x2": 211.16,
"r_y2": 548.83,
"r_x3": 50.11,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.51,
"r_x1": 259.17,
"r_y1": 557.51,
"r_x2": 259.17,
"r_y2": 548.92,
"r_x3": 215.1,
"r_y3": 548.92,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.12,
"r_y0": 557.73,
"r_x1": 286.36,
"r_y1": 557.73,
"r_x2": 286.36,
"r_y2": 548.83,
"r_x3": 263.12,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 569.69,
"r_x1": 286.37,
"r_y1": 569.69,
"r_x2": 286.37,
"r_y2": 560.78,
"r_x3": 50.11,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 226.89,
"r_y1": 713.15,
"r_x2": 226.89,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 490.71,
"r": 460.85,
"b": 501.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 501.46,
"r_x1": 316.07,
"r_y1": 501.46,
"r_x2": 316.07,
"r_y2": 490.71,
"r_x3": 308.86,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.69,
"r_y0": 501.46,
"r_x1": 460.85,
"r_y1": 501.46,
"r_x2": 460.85,
"r_y2": 490.71,
"r_x3": 325.69,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 512.89,
"r": 545.12,
"b": 653.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 521.8,
"r_x1": 545.12,
"r_y1": 521.8,
"r_x2": 545.12,
"r_y2": 512.89,
"r_x3": 320.82,
"r_y3": 512.89,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.75,
"r_x1": 545.12,
"r_y1": 533.75,
"r_x2": 545.12,
"r_y2": 524.85,
"r_x3": 308.86,
"r_y3": 524.85,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.71,
"r_x1": 545.12,
"r_y1": 545.71,
"r_x2": 545.12,
"r_y2": 536.8,
"r_x3": 308.86,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.66,
"r_x1": 545.12,
"r_y1": 557.66,
"r_x2": 545.12,
"r_y2": 548.76,
"r_x3": 308.86,
"r_y3": 548.76,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.62,
"r_x1": 545.12,
"r_y1": 569.62,
"r_x2": 545.12,
"r_y2": 560.71,
"r_x3": 308.86,
"r_y3": 560.71,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.57,
"r_x1": 545.12,
"r_y1": 581.57,
"r_x2": 545.12,
"r_y2": 572.67,
"r_x3": 308.86,
"r_y3": 572.67,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.53,
"r_x1": 545.12,
"r_y1": 593.53,
"r_x2": 545.12,
"r_y2": 584.62,
"r_x3": 308.86,
"r_y3": 584.62,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.49,
"r_x1": 400.47,
"r_y1": 605.49,
"r_x2": 400.47,
"r_y2": 596.58,
"r_x3": 308.86,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.38,
"r_y0": 605.49,
"r_x1": 545.12,
"r_y1": 605.49,
"r_x2": 545.12,
"r_y2": 596.58,
"r_x3": 408.38,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.44,
"r_x1": 545.12,
"r_y1": 617.44,
"r_x2": 545.12,
"r_y2": 608.53,
"r_x3": 308.86,
"r_y3": 608.53,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.4,
"r_x1": 545.12,
"r_y1": 629.4,
"r_x2": 545.12,
"r_y2": 620.49,
"r_x3": 308.86,
"r_y3": 620.49,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.35,
"r_x1": 545.12,
"r_y1": 641.35,
"r_x2": 545.12,
"r_y2": 632.44,
"r_x3": 308.86,
"r_y3": 632.44,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.31,
"r_x1": 365.86,
"r_y1": 653.31,
"r_x2": 365.86,
"r_y2": 644.4,
"r_x3": 308.86,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 672.1,
"r": 364.41,
"b": 682.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 682.85,
"r_x1": 364.41,
"r_y1": 682.85,
"r_x2": 364.41,
"r_y2": 672.1,
"r_x3": 308.86,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.35,
"t": 693.96,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.832,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.35,
"r_y0": 701.98,
"r_x1": 323.81,
"r_y1": 701.98,
"r_x2": 323.81,
"r_y2": 693.96,
"r_x3": 313.35,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.05,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 326.05,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 545.11,
"r_y1": 712.94,
"r_x2": 545.11,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.871,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "picture",
"bbox": {
"l": 305.58,
"t": 98.65,
"r": 554.83,
"b": 180.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
{
"id": 14,
"label": "picture",
"bbox": {
"l": 49.98,
"t": 103.71,
"r": 301.63,
"b": 187.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"8": {
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.63,
"t": 218.95,
"r": 298.56,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.11,
"t": 229.67,
"r": 201.29,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.59,
"r": 103.03,
"b": 253.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.03,
"t": 249.8,
"r": 128.96,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.05,
"t": 257.07,
"r": 93.22,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.22,
"t": 257.28,
"r": 119.15,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.45,
"t": 257.07,
"r": 129.88,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.18,
"t": 264.3,
"r": 65.34,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.34,
"t": 264.51,
"r": 122.38,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.45,
"t": 264.3,
"r": 129.88,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 101.99,
"t": 271.53,
"r": 109.74,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.74,
"t": 271.74,
"r": 114.93,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.39,
"t": 271.53,
"r": 122.14,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.14,
"t": 271.74,
"r": 127.32,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.69,
"t": 279.22,
"r": 110.17,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"7": {
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.92,
"t": 218.51,
"r": 550.23,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.82,
"t": 227.83,
"r": 507.23,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.75,
"t": 236.75,
"r": 404.65,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.65,
"t": 236.75,
"r": 407.35,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.65,
"t": 244.61,
"r": 364.66,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.75,
"t": 244.91,
"r": 403.76,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 480.98,
"t": 244.91,
"r": 483.55,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.75,
"t": 253.68,
"r": 403.76,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.73,
"t": 261.55,
"r": 403.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.74,
"t": 261.55,
"r": 405.54,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.73,
"t": 270.32,
"r": 403.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.74,
"t": 270.32,
"r": 405.54,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 18,
"page_no": 7,
"cluster": {
"id": 18,
"label": "caption",
"bbox": {
"l": 53.81,
"t": 208.23,
"r": 385.93,
"b": 216.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.599,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 216.11,
"r_x1": 62.22,
"r_y1": 216.11,
"r_x2": 62.22,
"r_y2": 208.23,
"r_x3": 53.81,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.42,
"r_y0": 216.11,
"r_x1": 385.93,
"r_y1": 216.11,
"r_x2": 385.93,
"r_y2": 208.23,
"r_x3": 66.42,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"
},
{
"label": "section_header",
"id": 29,
"page_no": 7,
"cluster": {
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.81,
"t": 94.28,
"r": 284.35,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.465,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 102.15,
"r_x1": 284.35,
"r_y1": 102.15,
"r_x2": 284.35,
"r_y2": 94.28,
"r_x3": 53.81,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Japanese language (previously unseen by TableFormer):"
},
{
"label": "section_header",
"id": 31,
"page_no": 7,
"cluster": {
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.83,
"t": 94.28,
"r": 431.09,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.463,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.83,
"r_y0": 102.15,
"r_x1": 431.09,
"r_y1": 102.15,
"r_x2": 431.09,
"r_y2": 94.28,
"r_x3": 304.83,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Example table from FinTabNet:"
},
{
"label": "list_item",
"id": 20,
"page_no": 7,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.29,
"t": 78.69,
"r": 61.55,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.582,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.29,
"r_y0": 86.56,
"r_x1": 61.55,
"r_y1": 86.56,
"r_x2": 61.55,
"r_y2": 78.69,
"r_x3": 53.29,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a."
},
{
"label": "list_item",
"id": 21,
"page_no": 7,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.68,
"t": 78.69,
"r": 499.56,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.541,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.68,
"r_y0": 86.56,
"r_x1": 499.56,
"r_y1": 86.56,
"r_x2": 499.56,
"r_y2": 78.69,
"r_x3": 65.68,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"
},
{
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.63,
"t": 218.95,
"r": 298.56,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.11,
"t": 229.67,
"r": 201.29,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.59,
"r": 103.03,
"b": 253.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.03,
"t": 249.8,
"r": 128.96,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.05,
"t": 257.07,
"r": 93.22,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.22,
"t": 257.28,
"r": 119.15,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.45,
"t": 257.07,
"r": 129.88,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.18,
"t": 264.3,
"r": 65.34,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.34,
"t": 264.51,
"r": 122.38,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.45,
"t": 264.3,
"r": 129.88,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 101.99,
"t": 271.53,
"r": 109.74,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.74,
"t": 271.74,
"r": 114.93,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.39,
"t": 271.53,
"r": 122.14,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.14,
"t": 271.74,
"r": 127.32,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.69,
"t": 279.22,
"r": 110.17,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 16,
"page_no": 7,
"cluster": {
"id": 16,
"label": "caption",
"bbox": {
"l": 380.43,
"t": 292.3,
"r": 549.42,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.43,
"r_y0": 298.6,
"r_x1": 549.42,
"r_y1": 298.6,
"r_x2": 549.42,
"r_y2": 292.3,
"r_x3": 380.43,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Text is aligned to match original for ease of viewing"
},
{
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.92,
"t": 218.51,
"r": 550.23,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.82,
"t": 227.83,
"r": 507.23,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.75,
"t": 236.75,
"r": 404.65,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.65,
"t": 236.75,
"r": 407.35,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.65,
"t": 244.61,
"r": 364.66,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.75,
"t": 244.91,
"r": 403.76,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 480.98,
"t": 244.91,
"r": 483.55,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.75,
"t": 253.68,
"r": 403.76,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.73,
"t": 261.55,
"r": 403.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.74,
"t": 261.55,
"r": 405.54,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.73,
"t": 270.32,
"r": 403.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.74,
"t": 270.32,
"r": 405.54,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 7,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 320.88,
"r": 545.11,
"b": 365.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.914,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 329.78,
"r_x1": 86.86,
"r_y1": 329.78,
"r_x2": 86.86,
"r_y2": 320.88,
"r_x3": 50.11,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.92,
"r_y0": 329.78,
"r_x1": 545.11,
"r_y1": 329.78,
"r_x2": 545.11,
"r_y2": 320.88,
"r_x3": 93.92,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 341.74,
"r_x1": 545.11,
"r_y1": 341.74,
"r_x2": 545.11,
"r_y2": 332.83,
"r_x3": 50.11,
"r_y3": 332.83,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 353.69,
"r_x1": 545.11,
"r_y1": 353.69,
"r_x2": 545.11,
"r_y2": 344.79,
"r_x3": 50.11,
"r_y3": 344.79,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.65,
"r_x1": 139.8,
"r_y1": 365.65,
"r_x2": 139.8,
"r_y2": 356.74,
"r_x3": 50.11,
"r_y3": 356.74,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."
},
{
"label": "picture",
"id": 12,
"page_no": 7,
"cluster": {
"id": 12,
"label": "picture",
"bbox": {
"l": 216.77,
"t": 380.49,
"r": 375.78,
"b": 443.35,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.26,
"t": 381.78,
"r": 342.08,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 11,
"page_no": 7,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 51.74,
"t": 380.48,
"r": 211.84,
"b": 443.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.831,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.72,
"t": 381.78,
"r": 85.66,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 13,
"page_no": 7,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 383.14,
"t": 381.23,
"r": 542.11,
"b": 442.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.788,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.38,
"t": 400.55,
"r": 443.7,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.33,
"t": 400.55,
"r": 456.65,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.28,
"t": 400.55,
"r": 469.6,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.24,
"t": 400.55,
"r": 482.56,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.19,
"t": 400.55,
"r": 495.51,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.14,
"t": 400.55,
"r": 508.46,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.55,
"r": 521.41,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.28,
"t": 411.04,
"r": 391.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.52,
"t": 411.04,
"r": 404.84,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.48,
"t": 411.04,
"r": 417.8,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.38,
"t": 411.04,
"r": 443.7,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.33,
"t": 411.04,
"r": 456.65,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.28,
"t": 411.04,
"r": 469.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.28,
"t": 421.07,
"r": 391.6,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.52,
"t": 421.07,
"r": 404.84,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.48,
"t": 421.07,
"r": 417.8,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.43,
"t": 421.07,
"r": 430.75,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.38,
"t": 421.07,
"r": 443.7,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.33,
"t": 421.07,
"r": 456.65,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.29,
"t": 421.07,
"r": 469.61,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.24,
"t": 421.07,
"r": 482.56,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.19,
"t": 421.07,
"r": 495.51,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.14,
"t": 421.07,
"r": 508.46,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.07,
"r": 521.42,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.05,
"t": 421.07,
"r": 534.37,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.28,
"t": 432.04,
"r": 391.6,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.52,
"t": 432.04,
"r": 404.84,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.48,
"t": 432.04,
"r": 417.8,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.43,
"t": 432.04,
"r": 430.75,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.38,
"t": 432.04,
"r": 443.7,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.33,
"t": 432.04,
"r": 456.65,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.29,
"t": 432.04,
"r": 469.61,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.24,
"t": 432.04,
"r": 482.56,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.19,
"t": 432.04,
"r": 495.51,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.14,
"t": 432.04,
"r": 508.46,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.04,
"r": 521.42,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.05,
"t": 432.04,
"r": 534.37,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.28,
"t": 389.2,
"r": 388.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.52,
"t": 389.2,
"r": 401.68,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.48,
"t": 389.2,
"r": 414.63,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.43,
"t": 389.2,
"r": 427.59,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.38,
"t": 389.2,
"r": 440.54,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.33,
"t": 389.2,
"r": 453.49,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.28,
"t": 389.2,
"r": 466.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.24,
"t": 389.2,
"r": 479.39,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.19,
"t": 389.2,
"r": 492.35,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.14,
"t": 389.2,
"r": 505.3,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.09,
"t": 389.2,
"r": 521.41,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.04,
"t": 389.2,
"r": 534.13,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.28,
"t": 398.97,
"r": 391.6,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.52,
"t": 398.97,
"r": 404.84,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.48,
"t": 398.97,
"r": 417.8,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.43,
"t": 406.77,
"r": 430.75,
"b": 413.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.87,
"t": 410.99,
"r": 509.19,
"b": 417.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.35,
"t": 381.78,
"r": 430.99,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 5,
"page_no": 7,
"cluster": {
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.73,
"r": 532.63,
"b": 467.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.915,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.63,
"r_x1": 532.63,
"r_y1": 467.63,
"r_x2": 532.63,
"r_y2": 458.73,
"r_x3": 62.6,
"r_y3": 458.73,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."
},
{
"label": "section_header",
"id": 2,
"page_no": 7,
"cluster": {
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 491.4,
"r": 163.76,
"b": 501.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.25,
"r_x1": 64.45,
"r_y1": 501.25,
"r_x2": 64.45,
"r_y2": 491.4,
"r_x3": 50.11,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.01,
"r_y0": 501.25,
"r_x1": 163.76,
"r_y1": 501.25,
"r_x2": 163.76,
"r_y2": 491.4,
"r_x3": 74.01,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.5. Qualitative Analysis"
},
{
"label": "text",
"id": 1,
"page_no": 7,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 536.87,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 545.78,
"r_x1": 286.36,
"r_y1": 545.78,
"r_x2": 286.36,
"r_y2": 536.87,
"r_x3": 62.07,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 557.73,
"r_x1": 211.16,
"r_y1": 557.73,
"r_x2": 211.16,
"r_y2": 548.83,
"r_x3": 50.11,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.51,
"r_x1": 259.17,
"r_y1": 557.51,
"r_x2": 259.17,
"r_y2": 548.92,
"r_x3": 215.1,
"r_y3": 548.92,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.12,
"r_y0": 557.73,
"r_x1": 286.36,
"r_y1": 557.73,
"r_x2": 286.36,
"r_y2": 548.83,
"r_x3": 263.12,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 569.69,
"r_x1": 286.37,
"r_y1": 569.69,
"r_x2": 286.37,
"r_y2": 560.78,
"r_x3": 50.11,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 226.89,
"r_y1": 713.15,
"r_x2": 226.89,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."
},
{
"label": "section_header",
"id": 4,
"page_no": 7,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 490.71,
"r": 460.85,
"b": 501.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 501.46,
"r_x1": 316.07,
"r_y1": 501.46,
"r_x2": 316.07,
"r_y2": 490.71,
"r_x3": 308.86,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.69,
"r_y0": 501.46,
"r_x1": 460.85,
"r_y1": 501.46,
"r_x2": 460.85,
"r_y2": 490.71,
"r_x3": 325.69,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Future Work & Conclusion"
},
{
"label": "text",
"id": 0,
"page_no": 7,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 512.89,
"r": 545.12,
"b": 653.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 521.8,
"r_x1": 545.12,
"r_y1": 521.8,
"r_x2": 545.12,
"r_y2": 512.89,
"r_x3": 320.82,
"r_y3": 512.89,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.75,
"r_x1": 545.12,
"r_y1": 533.75,
"r_x2": 545.12,
"r_y2": 524.85,
"r_x3": 308.86,
"r_y3": 524.85,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.71,
"r_x1": 545.12,
"r_y1": 545.71,
"r_x2": 545.12,
"r_y2": 536.8,
"r_x3": 308.86,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.66,
"r_x1": 545.12,
"r_y1": 557.66,
"r_x2": 545.12,
"r_y2": 548.76,
"r_x3": 308.86,
"r_y3": 548.76,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.62,
"r_x1": 545.12,
"r_y1": 569.62,
"r_x2": 545.12,
"r_y2": 560.71,
"r_x3": 308.86,
"r_y3": 560.71,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.57,
"r_x1": 545.12,
"r_y1": 581.57,
"r_x2": 545.12,
"r_y2": 572.67,
"r_x3": 308.86,
"r_y3": 572.67,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.53,
"r_x1": 545.12,
"r_y1": 593.53,
"r_x2": 545.12,
"r_y2": 584.62,
"r_x3": 308.86,
"r_y3": 584.62,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.49,
"r_x1": 400.47,
"r_y1": 605.49,
"r_x2": 400.47,
"r_y2": 596.58,
"r_x3": 308.86,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.38,
"r_y0": 605.49,
"r_x1": 545.12,
"r_y1": 605.49,
"r_x2": 545.12,
"r_y2": 596.58,
"r_x3": 408.38,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.44,
"r_x1": 545.12,
"r_y1": 617.44,
"r_x2": 545.12,
"r_y2": 608.53,
"r_x3": 308.86,
"r_y3": 608.53,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.4,
"r_x1": 545.12,
"r_y1": 629.4,
"r_x2": 545.12,
"r_y2": 620.49,
"r_x3": 308.86,
"r_y3": 620.49,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.35,
"r_x1": 545.12,
"r_y1": 641.35,
"r_x2": 545.12,
"r_y2": 632.44,
"r_x3": 308.86,
"r_y3": 632.44,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.31,
"r_x1": 365.86,
"r_y1": 653.31,
"r_x2": 365.86,
"r_y2": 644.4,
"r_x3": 308.86,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."
},
{
"label": "section_header",
"id": 3,
"page_no": 7,
"cluster": {
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 672.1,
"r": 364.41,
"b": 682.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 682.85,
"r_x1": 364.41,
"r_y1": 682.85,
"r_x2": 364.41,
"r_y2": 672.1,
"r_x3": 308.86,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "References"
},
{
"label": "list_item",
"id": 10,
"page_no": 7,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.35,
"t": 693.96,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.832,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.35,
"r_y0": 701.98,
"r_x1": 323.81,
"r_y1": 701.98,
"r_x2": 323.81,
"r_y2": 693.96,
"r_x3": 313.35,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.05,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 326.05,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 545.11,
"r_y1": 712.94,
"r_x2": 545.11,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"
},
{
"label": "page_footer",
"id": 9,
"page_no": 7,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.871,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8"
},
{
"label": "picture",
"id": 15,
"page_no": 7,
"cluster": {
"id": 15,
"label": "picture",
"bbox": {
"l": 305.58,
"t": 98.65,
"r": 554.83,
"b": 180.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 14,
"page_no": 7,
"cluster": {
"id": 14,
"label": "picture",
"bbox": {
"l": 49.98,
"t": 103.71,
"r": 301.63,
"b": 187.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 18,
"page_no": 7,
"cluster": {
"id": 18,
"label": "caption",
"bbox": {
"l": 53.81,
"t": 208.23,
"r": 385.93,
"b": 216.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.599,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 216.11,
"r_x1": 62.22,
"r_y1": 216.11,
"r_x2": 62.22,
"r_y2": 208.23,
"r_x3": 53.81,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.42,
"r_y0": 216.11,
"r_x1": 385.93,
"r_y1": 216.11,
"r_x2": 385.93,
"r_y2": 208.23,
"r_x3": 66.42,
"r_y3": 208.23,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"
},
{
"label": "section_header",
"id": 29,
"page_no": 7,
"cluster": {
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.81,
"t": 94.28,
"r": 284.35,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.465,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.81,
"r_y0": 102.15,
"r_x1": 284.35,
"r_y1": 102.15,
"r_x2": 284.35,
"r_y2": 94.28,
"r_x3": 53.81,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Japanese language (previously unseen by TableFormer):"
},
{
"label": "section_header",
"id": 31,
"page_no": 7,
"cluster": {
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.83,
"t": 94.28,
"r": 431.09,
"b": 102.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.463,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.83,
"r_y0": 102.15,
"r_x1": 431.09,
"r_y1": 102.15,
"r_x2": 431.09,
"r_y2": 94.28,
"r_x3": 304.83,
"r_y3": 94.28,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Example table from FinTabNet:"
},
{
"label": "list_item",
"id": 20,
"page_no": 7,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.29,
"t": 78.69,
"r": 61.55,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.582,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.29,
"r_y0": 86.56,
"r_x1": 61.55,
"r_y1": 86.56,
"r_x2": 61.55,
"r_y2": 78.69,
"r_x3": 53.29,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a."
},
{
"label": "list_item",
"id": 21,
"page_no": 7,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.68,
"t": 78.69,
"r": 499.56,
"b": 86.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.541,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.68,
"r_y0": 86.56,
"r_x1": 499.56,
"r_y1": 86.56,
"r_x2": 499.56,
"r_y2": 78.69,
"r_x3": 65.68,
"r_y3": 78.69,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"
},
{
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.63,
"t": 218.95,
"r": 298.56,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.93,
"r_y0": 226.36,
"r_x1": 241.04,
"r_y1": 226.36,
"r_x2": 241.04,
"r_y2": 222.18,
"r_x3": 209.93,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.76,
"r_y0": 226.36,
"r_x1": 284.51,
"r_y1": 226.36,
"r_x2": 284.51,
"r_y2": 222.18,
"r_x3": 263.76,
"r_y3": 222.18,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.25,
"r_y0": 233.85,
"r_x1": 120.62,
"r_y1": 233.85,
"r_x2": 120.62,
"r_y2": 229.67,
"r_x3": 110.25,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.37,
"r_y0": 233.85,
"r_x1": 196.11,
"r_y1": 233.85,
"r_x2": 196.11,
"r_y2": 229.67,
"r_x3": 175.37,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.11,
"t": 229.67,
"r": 201.29,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.11,
"r_y0": 233.85,
"r_x1": 201.29,
"r_y1": 233.85,
"r_x2": 201.29,
"r_y2": 229.67,
"r_x3": 196.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.62,
"r_y0": 233.85,
"r_x1": 219.99,
"r_y1": 233.85,
"r_x2": 219.99,
"r_y2": 229.67,
"r_x3": 209.62,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.85,
"r_x1": 244.75,
"r_y1": 233.85,
"r_x2": 244.75,
"r_y2": 229.67,
"r_x3": 229.2,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.11,
"r_y0": 233.85,
"r_x1": 266.48,
"r_y1": 233.85,
"r_x2": 266.48,
"r_y2": 229.67,
"r_x3": 256.11,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.38,
"r_y0": 233.85,
"r_x1": 293.94,
"r_y1": 233.85,
"r_x2": 293.94,
"r_y2": 229.67,
"r_x3": 278.38,
"r_y3": 229.67,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 240.78,
"r_x1": 162.71,
"r_y1": 240.78,
"r_x2": 162.71,
"r_y2": 236.43,
"r_x3": 55.53,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.78,
"r_x1": 189.56,
"r_y1": 240.78,
"r_x2": 189.56,
"r_y2": 236.43,
"r_x3": 184.4,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 240.78,
"r_x1": 214.16,
"r_y1": 240.78,
"r_x2": 214.16,
"r_y2": 236.43,
"r_x3": 208.99,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 240.78,
"r_x1": 237.46,
"r_y1": 240.78,
"r_x2": 237.46,
"r_y2": 236.43,
"r_x3": 234.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 240.78,
"r_x1": 264.64,
"r_y1": 240.78,
"r_x2": 264.64,
"r_y2": 236.43,
"r_x3": 256.88,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 240.78,
"r_x1": 286.64,
"r_y1": 240.78,
"r_x2": 286.64,
"r_y2": 236.43,
"r_x3": 284.06,
"r_y3": 236.43,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 246.98,
"r_x1": 139.72,
"r_y1": 246.98,
"r_x2": 139.72,
"r_y2": 242.62,
"r_x3": 55.53,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 246.98,
"r_x1": 190.86,
"r_y1": 246.98,
"r_x2": 190.86,
"r_y2": 242.62,
"r_x3": 183.11,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 246.98,
"r_x1": 215.45,
"r_y1": 246.98,
"r_x2": 215.45,
"r_y2": 242.62,
"r_x3": 207.7,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.88,
"r_y0": 246.98,
"r_x1": 237.46,
"r_y1": 246.98,
"r_x2": 237.46,
"r_y2": 242.62,
"r_x3": 234.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 246.98,
"r_x1": 264.64,
"r_y1": 246.98,
"r_x2": 264.64,
"r_y2": 242.62,
"r_x3": 256.88,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.06,
"r_y0": 246.98,
"r_x1": 286.64,
"r_y1": 246.98,
"r_x2": 286.64,
"r_y2": 242.62,
"r_x3": 284.06,
"r_y3": 242.62,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 253.98,
"r_x1": 97.01,
"r_y1": 253.98,
"r_x2": 97.01,
"r_y2": 249.8,
"r_x3": 55.53,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.59,
"r": 103.03,
"b": 253.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.95,
"r_x1": 103.03,
"r_y1": 253.95,
"r_x2": 103.03,
"r_y2": 249.59,
"r_x3": 92.7,
"r_y3": 249.59,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.03,
"t": 249.8,
"r": 128.96,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.03,
"r_y0": 253.98,
"r_x1": 128.96,
"r_y1": 253.98,
"r_x2": 128.96,
"r_y2": 249.8,
"r_x3": 103.03,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 253.17,
"r_x1": 190.86,
"r_y1": 253.17,
"r_x2": 190.86,
"r_y2": 248.82,
"r_x3": 183.11,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 253.17,
"r_x1": 212.87,
"r_y1": 253.17,
"r_x2": 212.87,
"r_y2": 248.82,
"r_x3": 210.28,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 253.17,
"r_x1": 240.04,
"r_y1": 253.17,
"r_x2": 240.04,
"r_y2": 248.82,
"r_x3": 232.29,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 253.17,
"r_x1": 264.64,
"r_y1": 253.17,
"r_x2": 264.64,
"r_y2": 248.82,
"r_x3": 256.88,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 253.17,
"r_x1": 289.23,
"r_y1": 253.17,
"r_x2": 289.23,
"r_y2": 248.82,
"r_x3": 281.48,
"r_y3": 248.82,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 261.47,
"r_x1": 91.83,
"r_y1": 261.47,
"r_x2": 91.83,
"r_y2": 257.28,
"r_x3": 55.53,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.05,
"t": 257.07,
"r": 93.22,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.05,
"r_y0": 261.43,
"r_x1": 93.22,
"r_y1": 261.43,
"r_x2": 93.22,
"r_y2": 257.07,
"r_x3": 88.05,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.22,
"t": 257.28,
"r": 119.15,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.22,
"r_y0": 261.47,
"r_x1": 119.15,
"r_y1": 261.47,
"r_x2": 119.15,
"r_y2": 257.28,
"r_x3": 93.22,
"r_y3": 257.28,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.45,
"t": 257.07,
"r": 129.88,
"b": 261.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 261.43,
"r_x1": 129.88,
"r_y1": 261.43,
"r_x2": 129.88,
"r_y2": 257.07,
"r_x3": 116.45,
"r_y3": 257.07,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 260.66,
"r_x1": 190.86,
"r_y1": 260.66,
"r_x2": 190.86,
"r_y2": 256.3,
"r_x3": 183.11,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 260.66,
"r_x1": 212.87,
"r_y1": 260.66,
"r_x2": 212.87,
"r_y2": 256.3,
"r_x3": 210.28,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 260.66,
"r_x1": 240.04,
"r_y1": 260.66,
"r_x2": 240.04,
"r_y2": 256.3,
"r_x3": 232.29,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 260.66,
"r_x1": 264.64,
"r_y1": 260.66,
"r_x2": 264.64,
"r_y2": 256.3,
"r_x3": 256.88,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 260.66,
"r_x1": 289.23,
"r_y1": 260.66,
"r_x2": 289.23,
"r_y2": 256.3,
"r_x3": 281.48,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 268.69,
"r_x1": 60.72,
"r_y1": 268.69,
"r_x2": 60.72,
"r_y2": 264.51,
"r_x3": 55.53,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.18,
"t": 264.3,
"r": 65.34,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.18,
"r_y0": 268.66,
"r_x1": 65.34,
"r_y1": 268.66,
"r_x2": 65.34,
"r_y2": 264.3,
"r_x3": 60.18,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.34,
"t": 264.51,
"r": 122.38,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.34,
"r_y0": 268.69,
"r_x1": 122.38,
"r_y1": 268.69,
"r_x2": 122.38,
"r_y2": 264.51,
"r_x3": 65.34,
"r_y3": 264.51,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.45,
"t": 264.3,
"r": 129.88,
"b": 268.66,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.45,
"r_y0": 268.66,
"r_x1": 129.88,
"r_y1": 268.66,
"r_x2": 129.88,
"r_y2": 264.3,
"r_x3": 116.45,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 267.89,
"r_x1": 190.86,
"r_y1": 267.89,
"r_x2": 190.86,
"r_y2": 263.53,
"r_x3": 183.11,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 267.89,
"r_x1": 212.87,
"r_y1": 267.89,
"r_x2": 212.87,
"r_y2": 263.53,
"r_x3": 210.28,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 267.89,
"r_x1": 240.04,
"r_y1": 267.89,
"r_x2": 240.04,
"r_y2": 263.53,
"r_x3": 232.29,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 267.89,
"r_x1": 264.64,
"r_y1": 267.89,
"r_x2": 264.64,
"r_y2": 263.53,
"r_x3": 256.88,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 267.89,
"r_x1": 289.23,
"r_y1": 267.89,
"r_x2": 289.23,
"r_y2": 263.53,
"r_x3": 281.48,
"r_y3": 263.53,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 275.92,
"r_x1": 107.38,
"r_y1": 275.92,
"r_x2": 107.38,
"r_y2": 271.74,
"r_x3": 55.53,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 101.99,
"t": 271.53,
"r": 109.74,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.99,
"r_y0": 275.89,
"r_x1": 109.74,
"r_y1": 275.89,
"r_x2": 109.74,
"r_y2": 271.53,
"r_x3": 101.99,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.74,
"t": 271.74,
"r": 114.93,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.74,
"r_y0": 275.92,
"r_x1": 114.93,
"r_y1": 275.92,
"r_x2": 114.93,
"r_y2": 271.74,
"r_x3": 109.74,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.39,
"t": 271.53,
"r": 122.14,
"b": 275.89,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.39,
"r_y0": 275.89,
"r_x1": 122.14,
"r_y1": 275.89,
"r_x2": 122.14,
"r_y2": 271.53,
"r_x3": 114.39,
"r_y3": 271.53,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.14,
"t": 271.74,
"r": 127.32,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.14,
"r_y0": 275.92,
"r_x1": 127.32,
"r_y1": 275.92,
"r_x2": 127.32,
"r_y2": 271.74,
"r_x3": 122.14,
"r_y3": 271.74,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.11,
"r_x1": 189.56,
"r_y1": 275.11,
"r_x2": 189.56,
"r_y2": 270.75,
"r_x3": 184.4,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.28,
"r_y0": 275.11,
"r_x1": 212.87,
"r_y1": 275.11,
"r_x2": 212.87,
"r_y2": 270.75,
"r_x3": 210.28,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 275.11,
"r_x1": 238.75,
"r_y1": 275.11,
"r_x2": 238.75,
"r_y2": 270.75,
"r_x3": 233.58,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 275.11,
"r_x1": 264.64,
"r_y1": 275.11,
"r_x2": 264.64,
"r_y2": 270.75,
"r_x3": 256.88,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 275.11,
"r_x1": 289.23,
"r_y1": 275.11,
"r_x2": 289.23,
"r_y2": 270.75,
"r_x3": 281.48,
"r_y3": 270.75,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.53,
"r_y0": 283.37,
"r_x1": 68.69,
"r_y1": 283.37,
"r_x2": 68.69,
"r_y2": 279.01,
"r_x3": 55.53,
"r_y3": 279.01,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.69,
"t": 279.22,
"r": 110.17,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.69,
"r_y0": 283.4,
"r_x1": 110.17,
"r_y1": 283.4,
"r_x2": 110.17,
"r_y2": 279.22,
"r_x3": 68.69,
"r_y3": 279.22,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 282.34,
"r_x1": 190.86,
"r_y1": 282.34,
"r_x2": 190.86,
"r_y2": 277.98,
"r_x3": 183.11,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.99,
"r_y0": 282.34,
"r_x1": 214.16,
"r_y1": 282.34,
"r_x2": 214.16,
"r_y2": 277.98,
"r_x3": 208.99,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.58,
"r_y0": 282.34,
"r_x1": 238.75,
"r_y1": 282.34,
"r_x2": 238.75,
"r_y2": 277.98,
"r_x3": 233.58,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.88,
"r_y0": 282.34,
"r_x1": 264.64,
"r_y1": 282.34,
"r_x2": 264.64,
"r_y2": 277.98,
"r_x3": 256.88,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.77,
"r_y0": 282.34,
"r_x1": 287.94,
"r_y1": 282.34,
"r_x2": 287.94,
"r_y2": 277.98,
"r_x3": 282.77,
"r_y3": 277.98,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.62,
"r_y0": 290.63,
"r_x1": 174.8,
"r_y1": 290.63,
"r_x2": 174.8,
"r_y2": 286.45,
"r_x3": 169.62,
"r_y3": 286.45,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.11,
"r_y0": 289.82,
"r_x1": 190.86,
"r_y1": 289.82,
"r_x2": 190.86,
"r_y2": 285.47,
"r_x3": 183.11,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.82,
"r_x1": 215.45,
"r_y1": 289.82,
"r_x2": 215.45,
"r_y2": 285.47,
"r_x3": 207.7,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.29,
"r_y0": 289.82,
"r_x1": 240.04,
"r_y1": 289.82,
"r_x2": 240.04,
"r_y2": 285.47,
"r_x3": 232.29,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.77,
"r_y0": 289.82,
"r_x1": 265.75,
"r_y1": 289.82,
"r_x2": 265.75,
"r_y2": 285.47,
"r_x3": 255.77,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.48,
"r_y0": 289.82,
"r_x1": 289.23,
"r_y1": 289.82,
"r_x2": 289.23,
"r_y2": 285.47,
"r_x3": 281.48,
"r_y3": 285.47,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.93,
"t": 222.18,
"r": 241.04,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.76,
"t": 222.18,
"r": 284.51,
"b": 226.36,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.25,
"t": 229.67,
"r": 120.62,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.37,
"t": 229.67,
"r": 196.11,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.62,
"t": 229.67,
"r": 219.99,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.67,
"r": 244.75,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.11,
"t": 229.67,
"r": 266.48,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.38,
"t": 229.67,
"r": 293.94,
"b": 233.85,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 236.43,
"r": 162.71,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.43,
"r": 189.56,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 236.43,
"r": 214.16,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 236.43,
"r": 237.46,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 236.43,
"r": 264.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 236.43,
"r": 286.64,
"b": 240.78,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 242.62,
"r": 139.72,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 242.62,
"r": 190.86,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.62,
"r": 215.45,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.88,
"t": 242.62,
"r": 237.46,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 242.62,
"r": 264.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.06,
"t": 242.62,
"r": 286.64,
"b": 246.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 249.8,
"r": 97.01,
"b": 253.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 248.82,
"r": 190.86,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 248.82,
"r": 212.87,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 248.82,
"r": 240.04,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 248.82,
"r": 264.64,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 248.82,
"r": 289.23,
"b": 253.17,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 257.28,
"r": 91.83,
"b": 261.47,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 256.3,
"r": 190.86,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 256.3,
"r": 212.87,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 256.3,
"r": 240.04,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 256.3,
"r": 264.64,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 256.3,
"r": 289.23,
"b": 260.66,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 264.51,
"r": 60.72,
"b": 268.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 263.53,
"r": 190.86,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 263.53,
"r": 212.87,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 263.53,
"r": 240.04,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 263.53,
"r": 264.64,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 263.53,
"r": 289.23,
"b": 267.89,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 271.74,
"r": 107.38,
"b": 275.92,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.75,
"r": 189.56,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.28,
"t": 270.75,
"r": 212.87,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 270.75,
"r": 238.75,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 270.75,
"r": 264.64,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 270.75,
"r": 289.23,
"b": 275.11,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.53,
"t": 279.01,
"r": 68.69,
"b": 283.37,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 277.98,
"r": 190.86,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 208.99,
"t": 277.98,
"r": 214.16,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.58,
"t": 277.98,
"r": 238.75,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.88,
"t": 277.98,
"r": 264.64,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.77,
"t": 277.98,
"r": 287.94,
"b": 282.34,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.62,
"t": 286.45,
"r": 174.8,
"b": 290.63,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.11,
"t": 285.47,
"r": 190.86,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.47,
"r": 215.45,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.29,
"t": 285.47,
"r": 240.04,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.77,
"t": 285.47,
"r": 265.75,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.48,
"t": 285.47,
"r": 289.23,
"b": 289.82,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 16,
"page_no": 7,
"cluster": {
"id": 16,
"label": "caption",
"bbox": {
"l": 380.43,
"t": 292.3,
"r": 549.42,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.43,
"r_y0": 298.6,
"r_x1": 549.42,
"r_y1": 298.6,
"r_x2": 549.42,
"r_y2": 292.3,
"r_x3": 380.43,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Text is aligned to match original for ease of viewing"
},
{
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.92,
"t": 218.51,
"r": 550.23,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.05,
"r_y0": 226.69,
"r_x1": 542.0,
"r_y1": 226.69,
"r_x2": 542.0,
"r_y2": 221.62,
"r_x3": 459.05,
"r_y3": 221.62,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.82,
"t": 227.83,
"r": 507.23,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.82,
"r_y0": 232.9,
"r_x1": 507.23,
"r_y1": 232.9,
"r_x2": 507.23,
"r_y2": 227.83,
"r_x3": 493.82,
"r_y3": 227.83,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.24,
"r_y0": 241.81,
"r_x1": 400.75,
"r_y1": 241.81,
"r_x2": 400.75,
"r_y2": 236.75,
"r_x3": 393.24,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.75,
"t": 236.75,
"r": 404.65,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 241.81,
"r_x1": 404.65,
"r_y1": 241.81,
"r_x2": 404.65,
"r_y2": 236.75,
"r_x3": 400.75,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.65,
"t": 236.75,
"r": 407.35,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.65,
"r_y0": 241.81,
"r_x1": 407.35,
"r_y1": 241.81,
"r_x2": 407.35,
"r_y2": 236.75,
"r_x3": 404.65,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.64,
"r_x1": 438.01,
"r_y1": 226.64,
"r_x2": 438.01,
"r_y2": 221.57,
"r_x3": 392.1,
"r_y3": 221.57,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.18,
"r_y0": 241.81,
"r_x1": 440.99,
"r_y1": 241.81,
"r_x2": 440.99,
"r_y2": 236.75,
"r_x3": 427.18,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.38,
"r_y0": 241.81,
"r_x1": 482.48,
"r_y1": 241.81,
"r_x2": 482.48,
"r_y2": 236.75,
"r_x3": 468.38,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.93,
"r_y0": 241.81,
"r_x1": 530.73,
"r_y1": 241.81,
"r_x2": 530.73,
"r_y2": 236.75,
"r_x3": 516.93,
"r_y3": 236.75,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 249.68,
"r_x1": 355.65,
"r_y1": 249.68,
"r_x2": 355.65,
"r_y2": 244.61,
"r_x3": 306.11,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.65,
"t": 244.61,
"r": 364.66,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.65,
"r_y0": 249.68,
"r_x1": 364.66,
"r_y1": 249.68,
"r_x2": 364.66,
"r_y2": 244.61,
"r_x3": 355.65,
"r_y3": 244.61,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 249.98,
"r_x1": 400.75,
"r_y1": 249.98,
"r_x2": 400.75,
"r_y2": 244.91,
"r_x3": 396.25,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.75,
"t": 244.91,
"r": 403.76,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 249.98,
"r_x1": 403.76,
"r_y1": 249.98,
"r_x2": 403.76,
"r_y2": 244.91,
"r_x3": 400.75,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 249.98,
"r_x1": 437.33,
"r_y1": 249.98,
"r_x2": 437.33,
"r_y2": 244.91,
"r_x3": 429.82,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.53,
"r_y0": 249.98,
"r_x1": 478.4,
"r_y1": 249.98,
"r_x2": 478.4,
"r_y2": 244.91,
"r_x3": 465.53,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 480.98,
"t": 244.91,
"r": 483.55,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 480.98,
"r_y0": 249.98,
"r_x1": 483.55,
"r_y1": 249.98,
"r_x2": 483.55,
"r_y2": 244.91,
"r_x3": 480.98,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.45,
"r_y0": 249.98,
"r_x1": 531.47,
"r_y1": 249.98,
"r_x2": 531.47,
"r_y2": 244.91,
"r_x3": 513.45,
"r_y3": 244.91,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 258.75,
"r_x1": 325.63,
"r_y1": 258.75,
"r_x2": 325.63,
"r_y2": 253.68,
"r_x3": 306.11,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 258.75,
"r_x1": 400.75,
"r_y1": 258.75,
"r_x2": 400.75,
"r_y2": 253.68,
"r_x3": 396.25,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.75,
"t": 253.68,
"r": 403.76,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.75,
"r_y0": 258.75,
"r_x1": 403.76,
"r_y1": 258.75,
"r_x2": 403.76,
"r_y2": 253.68,
"r_x3": 400.75,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.82,
"r_y0": 258.75,
"r_x1": 437.33,
"r_y1": 258.75,
"r_x2": 437.33,
"r_y2": 253.68,
"r_x3": 429.82,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.44,
"r_y0": 258.75,
"r_x1": 482.55,
"r_y1": 258.75,
"r_x2": 482.55,
"r_y2": 253.68,
"r_x3": 466.44,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.29,
"r_y0": 258.75,
"r_x1": 530.81,
"r_y1": 258.75,
"r_x2": 530.81,
"r_y2": 253.68,
"r_x3": 514.29,
"r_y3": 253.68,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 266.61,
"r_x1": 322.63,
"r_y1": 266.61,
"r_x2": 322.63,
"r_y2": 261.55,
"r_x3": 306.11,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 266.61,
"r_x1": 400.74,
"r_y1": 266.61,
"r_x2": 400.74,
"r_y2": 261.55,
"r_x3": 394.43,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.73,
"t": 261.55,
"r": 403.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 266.61,
"r_x1": 403.74,
"r_y1": 266.61,
"r_x2": 403.74,
"r_y2": 261.55,
"r_x3": 400.73,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.74,
"t": 261.55,
"r": 405.54,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 266.61,
"r_x1": 405.54,
"r_y1": 266.61,
"r_x2": 405.54,
"r_y2": 261.55,
"r_x3": 403.74,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.61,
"r_x1": 438.81,
"r_y1": 266.61,
"r_x2": 438.81,
"r_y2": 261.55,
"r_x3": 427.7,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.56,
"r_y0": 266.61,
"r_x1": 482.07,
"r_y1": 266.61,
"r_x2": 482.07,
"r_y2": 261.55,
"r_x3": 468.56,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 266.61,
"r_x1": 529.53,
"r_y1": 266.61,
"r_x2": 529.53,
"r_y2": 261.55,
"r_x3": 516.02,
"r_y3": 261.55,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 274.71,
"r_x1": 356.25,
"r_y1": 274.71,
"r_x2": 356.25,
"r_y2": 269.64,
"r_x3": 306.11,
"r_y3": 269.64,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.43,
"r_y0": 275.38,
"r_x1": 400.74,
"r_y1": 275.38,
"r_x2": 400.74,
"r_y2": 270.32,
"r_x3": 394.43,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.73,
"t": 270.32,
"r": 403.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.73,
"r_y0": 275.38,
"r_x1": 403.74,
"r_y1": 275.38,
"r_x2": 403.74,
"r_y2": 270.32,
"r_x3": 400.73,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.74,
"t": 270.32,
"r": 405.54,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.74,
"r_y0": 275.38,
"r_x1": 405.54,
"r_y1": 275.38,
"r_x2": 405.54,
"r_y2": 270.32,
"r_x3": 403.74,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.03,
"r_y0": 275.38,
"r_x1": 436.43,
"r_y1": 275.38,
"r_x2": 436.43,
"r_y2": 270.32,
"r_x3": 431.03,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.83,
"r_y0": 275.38,
"r_x1": 482.35,
"r_y1": 275.38,
"r_x2": 482.35,
"r_y2": 270.32,
"r_x3": 465.83,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.02,
"r_y0": 275.38,
"r_x1": 529.53,
"r_y1": 275.38,
"r_x2": 529.53,
"r_y2": 270.32,
"r_x3": 516.02,
"r_y3": 270.32,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.11,
"r_y0": 283.55,
"r_x1": 373.36,
"r_y1": 283.55,
"r_x2": 373.36,
"r_y2": 278.49,
"r_x3": 306.11,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.25,
"r_y0": 283.55,
"r_x1": 403.76,
"r_y1": 283.55,
"r_x2": 403.76,
"r_y2": 278.49,
"r_x3": 396.25,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.52,
"r_y0": 283.55,
"r_x1": 437.02,
"r_y1": 283.55,
"r_x2": 437.02,
"r_y2": 278.49,
"r_x3": 429.52,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.71,
"r_y0": 283.55,
"r_x1": 484.74,
"r_y1": 283.55,
"r_x2": 484.74,
"r_y2": 278.49,
"r_x3": 463.71,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.99,
"r_y0": 283.55,
"r_x1": 534.02,
"r_y1": 283.55,
"r_x2": 534.02,
"r_y2": 278.49,
"r_x3": 512.99,
"r_y3": 278.49,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.05,
"t": 221.62,
"r": 542.0,
"b": 226.69,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.24,
"t": 236.75,
"r": 400.75,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.57,
"r": 438.01,
"b": 226.64,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.18,
"t": 236.75,
"r": 440.99,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.38,
"t": 236.75,
"r": 482.48,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.93,
"t": 236.75,
"r": 530.73,
"b": 241.81,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 244.61,
"r": 355.65,
"b": 249.68,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 244.91,
"r": 400.75,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 244.91,
"r": 437.33,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.53,
"t": 244.91,
"r": 478.4,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.45,
"t": 244.91,
"r": 531.47,
"b": 249.98,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 253.68,
"r": 325.63,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 253.68,
"r": 400.75,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.82,
"t": 253.68,
"r": 437.33,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.44,
"t": 253.68,
"r": 482.55,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.29,
"t": 253.68,
"r": 530.81,
"b": 258.75,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 261.55,
"r": 322.63,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 261.55,
"r": 400.74,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.55,
"r": 438.81,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.56,
"t": 261.55,
"r": 482.07,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 261.55,
"r": 529.53,
"b": 266.61,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 269.64,
"r": 356.25,
"b": 274.71,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.43,
"t": 270.32,
"r": 400.74,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.03,
"t": 270.32,
"r": 436.43,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.83,
"t": 270.32,
"r": 482.35,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.02,
"t": 270.32,
"r": 529.53,
"b": 275.38,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.11,
"t": 278.49,
"r": 373.36,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.25,
"t": 278.49,
"r": 403.76,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.52,
"t": 278.49,
"r": 437.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.71,
"t": 278.49,
"r": 484.74,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.99,
"t": 278.49,
"r": 534.02,
"b": 283.55,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 7,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 320.88,
"r": 545.11,
"b": 365.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.914,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 329.78,
"r_x1": 86.86,
"r_y1": 329.78,
"r_x2": 86.86,
"r_y2": 320.88,
"r_x3": 50.11,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.92,
"r_y0": 329.78,
"r_x1": 545.11,
"r_y1": 329.78,
"r_x2": 545.11,
"r_y2": 320.88,
"r_x3": 93.92,
"r_y3": 320.88,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 341.74,
"r_x1": 545.11,
"r_y1": 341.74,
"r_x2": 545.11,
"r_y2": 332.83,
"r_x3": 50.11,
"r_y3": 332.83,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 353.69,
"r_x1": 545.11,
"r_y1": 353.69,
"r_x2": 545.11,
"r_y2": 344.79,
"r_x3": 50.11,
"r_y3": 344.79,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.65,
"r_x1": 139.8,
"r_y1": 365.65,
"r_x2": 139.8,
"r_y2": 356.74,
"r_x3": 50.11,
"r_y3": 356.74,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."
},
{
"label": "picture",
"id": 12,
"page_no": 7,
"cluster": {
"id": 12,
"label": "picture",
"bbox": {
"l": 216.77,
"t": 380.49,
"r": 375.78,
"b": 443.35,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.26,
"t": 381.78,
"r": 342.08,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.26,
"r_y0": 386.44,
"r_x1": 342.08,
"r_y1": 386.44,
"r_x2": 342.08,
"r_y2": 381.78,
"r_x3": 220.26,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 11,
"page_no": 7,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 51.74,
"t": 380.48,
"r": 211.84,
"b": 443.66,
"coord_origin": "TOPLEFT"
},
"confidence": 0.831,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.72,
"t": 381.78,
"r": 85.66,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.72,
"r_y0": 386.44,
"r_x1": 85.66,
"r_y1": 386.44,
"r_x2": 85.66,
"r_y2": 381.78,
"r_x3": 53.72,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 13,
"page_no": 7,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 383.14,
"t": 381.23,
"r": 542.11,
"b": 442.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.788,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.38,
"t": 400.55,
"r": 443.7,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 406.87,
"r_x1": 443.7,
"r_y1": 406.87,
"r_x2": 443.7,
"r_y2": 400.55,
"r_x3": 437.38,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.33,
"t": 400.55,
"r": 456.65,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 406.87,
"r_x1": 456.65,
"r_y1": 406.87,
"r_x2": 456.65,
"r_y2": 400.55,
"r_x3": 450.33,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.28,
"t": 400.55,
"r": 469.6,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 406.87,
"r_x1": 469.6,
"r_y1": 406.87,
"r_x2": 469.6,
"r_y2": 400.55,
"r_x3": 463.28,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.24,
"t": 400.55,
"r": 482.56,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 406.87,
"r_x1": 482.56,
"r_y1": 406.87,
"r_x2": 482.56,
"r_y2": 400.55,
"r_x3": 476.24,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.19,
"t": 400.55,
"r": 495.51,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 406.87,
"r_x1": 495.51,
"r_y1": 406.87,
"r_x2": 495.51,
"r_y2": 400.55,
"r_x3": 489.19,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.14,
"t": 400.55,
"r": 508.46,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 406.87,
"r_x1": 508.46,
"r_y1": 406.87,
"r_x2": 508.46,
"r_y2": 400.55,
"r_x3": 502.14,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.55,
"r": 521.41,
"b": 406.87,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.87,
"r_x1": 521.41,
"r_y1": 406.87,
"r_x2": 521.41,
"r_y2": 400.55,
"r_x3": 515.1,
"r_y3": 400.55,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.28,
"t": 411.04,
"r": 391.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 417.36,
"r_x1": 391.6,
"r_y1": 417.36,
"r_x2": 391.6,
"r_y2": 411.04,
"r_x3": 385.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.52,
"t": 411.04,
"r": 404.84,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 417.36,
"r_x1": 404.84,
"r_y1": 417.36,
"r_x2": 404.84,
"r_y2": 411.04,
"r_x3": 398.52,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.48,
"t": 411.04,
"r": 417.8,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 417.36,
"r_x1": 417.8,
"r_y1": 417.36,
"r_x2": 417.8,
"r_y2": 411.04,
"r_x3": 411.48,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.38,
"t": 411.04,
"r": 443.7,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 417.36,
"r_x1": 443.7,
"r_y1": 417.36,
"r_x2": 443.7,
"r_y2": 411.04,
"r_x3": 437.38,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.33,
"t": 411.04,
"r": 456.65,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 417.36,
"r_x1": 456.65,
"r_y1": 417.36,
"r_x2": 456.65,
"r_y2": 411.04,
"r_x3": 450.33,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.28,
"t": 411.04,
"r": 469.6,
"b": 417.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 417.36,
"r_x1": 469.6,
"r_y1": 417.36,
"r_x2": 469.6,
"r_y2": 411.04,
"r_x3": 463.28,
"r_y3": 411.04,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.28,
"t": 421.07,
"r": 391.6,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 427.39,
"r_x1": 391.6,
"r_y1": 427.39,
"r_x2": 391.6,
"r_y2": 421.07,
"r_x3": 385.28,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.52,
"t": 421.07,
"r": 404.84,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 427.39,
"r_x1": 404.84,
"r_y1": 427.39,
"r_x2": 404.84,
"r_y2": 421.07,
"r_x3": 398.52,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.48,
"t": 421.07,
"r": 417.8,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 427.39,
"r_x1": 417.8,
"r_y1": 427.39,
"r_x2": 417.8,
"r_y2": 421.07,
"r_x3": 411.48,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.43,
"t": 421.07,
"r": 430.75,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 427.39,
"r_x1": 430.75,
"r_y1": 427.39,
"r_x2": 430.75,
"r_y2": 421.07,
"r_x3": 424.43,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.38,
"t": 421.07,
"r": 443.7,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 427.39,
"r_x1": 443.7,
"r_y1": 427.39,
"r_x2": 443.7,
"r_y2": 421.07,
"r_x3": 437.38,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.33,
"t": 421.07,
"r": 456.65,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 427.39,
"r_x1": 456.65,
"r_y1": 427.39,
"r_x2": 456.65,
"r_y2": 421.07,
"r_x3": 450.33,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.29,
"t": 421.07,
"r": 469.61,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 427.39,
"r_x1": 469.61,
"r_y1": 427.39,
"r_x2": 469.61,
"r_y2": 421.07,
"r_x3": 463.29,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.24,
"t": 421.07,
"r": 482.56,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 427.39,
"r_x1": 482.56,
"r_y1": 427.39,
"r_x2": 482.56,
"r_y2": 421.07,
"r_x3": 476.24,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.19,
"t": 421.07,
"r": 495.51,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 427.39,
"r_x1": 495.51,
"r_y1": 427.39,
"r_x2": 495.51,
"r_y2": 421.07,
"r_x3": 489.19,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.14,
"t": 421.07,
"r": 508.46,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 427.39,
"r_x1": 508.46,
"r_y1": 427.39,
"r_x2": 508.46,
"r_y2": 421.07,
"r_x3": 502.14,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.07,
"r": 521.42,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.39,
"r_x1": 521.42,
"r_y1": 427.39,
"r_x2": 521.42,
"r_y2": 421.07,
"r_x3": 515.1,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.05,
"t": 421.07,
"r": 534.37,
"b": 427.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 427.39,
"r_x1": 534.37,
"r_y1": 427.39,
"r_x2": 534.37,
"r_y2": 421.07,
"r_x3": 528.05,
"r_y3": 421.07,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.28,
"t": 432.04,
"r": 391.6,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 438.36,
"r_x1": 391.6,
"r_y1": 438.36,
"r_x2": 391.6,
"r_y2": 432.04,
"r_x3": 385.28,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.52,
"t": 432.04,
"r": 404.84,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 438.36,
"r_x1": 404.84,
"r_y1": 438.36,
"r_x2": 404.84,
"r_y2": 432.04,
"r_x3": 398.52,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.48,
"t": 432.04,
"r": 417.8,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 438.36,
"r_x1": 417.8,
"r_y1": 438.36,
"r_x2": 417.8,
"r_y2": 432.04,
"r_x3": 411.48,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.43,
"t": 432.04,
"r": 430.75,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 438.36,
"r_x1": 430.75,
"r_y1": 438.36,
"r_x2": 430.75,
"r_y2": 432.04,
"r_x3": 424.43,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.38,
"t": 432.04,
"r": 443.7,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 438.36,
"r_x1": 443.7,
"r_y1": 438.36,
"r_x2": 443.7,
"r_y2": 432.04,
"r_x3": 437.38,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.33,
"t": 432.04,
"r": 456.65,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 438.36,
"r_x1": 456.65,
"r_y1": 438.36,
"r_x2": 456.65,
"r_y2": 432.04,
"r_x3": 450.33,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.29,
"t": 432.04,
"r": 469.61,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.29,
"r_y0": 438.36,
"r_x1": 469.61,
"r_y1": 438.36,
"r_x2": 469.61,
"r_y2": 432.04,
"r_x3": 463.29,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.24,
"t": 432.04,
"r": 482.56,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 438.36,
"r_x1": 482.56,
"r_y1": 438.36,
"r_x2": 482.56,
"r_y2": 432.04,
"r_x3": 476.24,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.19,
"t": 432.04,
"r": 495.51,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 438.36,
"r_x1": 495.51,
"r_y1": 438.36,
"r_x2": 495.51,
"r_y2": 432.04,
"r_x3": 489.19,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.14,
"t": 432.04,
"r": 508.46,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 438.36,
"r_x1": 508.46,
"r_y1": 438.36,
"r_x2": 508.46,
"r_y2": 432.04,
"r_x3": 502.14,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.04,
"r": 521.42,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.36,
"r_x1": 521.42,
"r_y1": 438.36,
"r_x2": 521.42,
"r_y2": 432.04,
"r_x3": 515.1,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.05,
"t": 432.04,
"r": 534.37,
"b": 438.36,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.05,
"r_y0": 438.36,
"r_x1": 534.37,
"r_y1": 438.36,
"r_x2": 534.37,
"r_y2": 432.04,
"r_x3": 528.05,
"r_y3": 432.04,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.28,
"t": 389.2,
"r": 388.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 395.52,
"r_x1": 388.44,
"r_y1": 395.52,
"r_x2": 388.44,
"r_y2": 389.2,
"r_x3": 385.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.52,
"t": 389.2,
"r": 401.68,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 395.52,
"r_x1": 401.68,
"r_y1": 395.52,
"r_x2": 401.68,
"r_y2": 389.2,
"r_x3": 398.52,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.48,
"t": 389.2,
"r": 414.63,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 395.52,
"r_x1": 414.63,
"r_y1": 395.52,
"r_x2": 414.63,
"r_y2": 389.2,
"r_x3": 411.48,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.43,
"t": 389.2,
"r": 427.59,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 395.52,
"r_x1": 427.59,
"r_y1": 395.52,
"r_x2": 427.59,
"r_y2": 389.2,
"r_x3": 424.43,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.38,
"t": 389.2,
"r": 440.54,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.38,
"r_y0": 395.52,
"r_x1": 440.54,
"r_y1": 395.52,
"r_x2": 440.54,
"r_y2": 389.2,
"r_x3": 437.38,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.33,
"t": 389.2,
"r": 453.49,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.33,
"r_y0": 395.52,
"r_x1": 453.49,
"r_y1": 395.52,
"r_x2": 453.49,
"r_y2": 389.2,
"r_x3": 450.33,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.28,
"t": 389.2,
"r": 466.44,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.28,
"r_y0": 395.52,
"r_x1": 466.44,
"r_y1": 395.52,
"r_x2": 466.44,
"r_y2": 389.2,
"r_x3": 463.28,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.24,
"t": 389.2,
"r": 479.39,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.24,
"r_y0": 395.52,
"r_x1": 479.39,
"r_y1": 395.52,
"r_x2": 479.39,
"r_y2": 389.2,
"r_x3": 476.24,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.19,
"t": 389.2,
"r": 492.35,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.19,
"r_y0": 395.52,
"r_x1": 492.35,
"r_y1": 395.52,
"r_x2": 492.35,
"r_y2": 389.2,
"r_x3": 489.19,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.14,
"t": 389.2,
"r": 505.3,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.14,
"r_y0": 395.52,
"r_x1": 505.3,
"r_y1": 395.52,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.14,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.09,
"t": 389.2,
"r": 521.41,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.09,
"r_y0": 395.52,
"r_x1": 521.41,
"r_y1": 395.52,
"r_x2": 521.41,
"r_y2": 389.2,
"r_x3": 515.09,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.04,
"t": 389.2,
"r": 534.13,
"b": 395.52,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.04,
"r_y0": 395.52,
"r_x1": 534.13,
"r_y1": 395.52,
"r_x2": 534.13,
"r_y2": 389.2,
"r_x3": 528.04,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.28,
"t": 398.97,
"r": 391.6,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.28,
"r_y0": 405.29,
"r_x1": 391.6,
"r_y1": 405.29,
"r_x2": 391.6,
"r_y2": 398.97,
"r_x3": 385.28,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.52,
"t": 398.97,
"r": 404.84,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.52,
"r_y0": 405.29,
"r_x1": 404.84,
"r_y1": 405.29,
"r_x2": 404.84,
"r_y2": 398.97,
"r_x3": 398.52,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.48,
"t": 398.97,
"r": 417.8,
"b": 405.29,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.48,
"r_y0": 405.29,
"r_x1": 417.8,
"r_y1": 405.29,
"r_x2": 417.8,
"r_y2": 398.97,
"r_x3": 411.48,
"r_y3": 398.97,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.43,
"t": 406.77,
"r": 430.75,
"b": 413.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.43,
"r_y0": 413.09,
"r_x1": 430.75,
"r_y1": 413.09,
"r_x2": 430.75,
"r_y2": 406.77,
"r_x3": 424.43,
"r_y3": 406.77,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.87,
"t": 410.99,
"r": 509.19,
"b": 417.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.87,
"r_y0": 417.31,
"r_x1": 509.19,
"r_y1": 417.31,
"r_x2": 509.19,
"r_y2": 410.99,
"r_x3": 502.87,
"r_y3": 410.99,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.35,
"t": 381.78,
"r": 430.99,
"b": 386.44,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.35,
"r_y0": 386.44,
"r_x1": 430.99,
"r_y1": 386.44,
"r_x2": 430.99,
"r_y2": 381.78,
"r_x3": 384.35,
"r_y3": 381.78,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 5,
"page_no": 7,
"cluster": {
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.73,
"r": 532.63,
"b": 467.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.915,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.63,
"r_x1": 532.63,
"r_y1": 467.63,
"r_x2": 532.63,
"r_y2": 458.73,
"r_x3": 62.6,
"r_y3": 458.73,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."
},
{
"label": "section_header",
"id": 2,
"page_no": 7,
"cluster": {
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 491.4,
"r": 163.76,
"b": 501.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 501.25,
"r_x1": 64.45,
"r_y1": 501.25,
"r_x2": 64.45,
"r_y2": 491.4,
"r_x3": 50.11,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.01,
"r_y0": 501.25,
"r_x1": 163.76,
"r_y1": 501.25,
"r_x2": 163.76,
"r_y2": 491.4,
"r_x3": 74.01,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.5. Qualitative Analysis"
},
{
"label": "text",
"id": 1,
"page_no": 7,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 536.87,
"r": 286.37,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.985,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 545.78,
"r_x1": 286.36,
"r_y1": 545.78,
"r_x2": 286.36,
"r_y2": 536.87,
"r_x3": 62.07,
"r_y3": 536.87,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 557.73,
"r_x1": 211.16,
"r_y1": 557.73,
"r_x2": 211.16,
"r_y2": 548.83,
"r_x3": 50.11,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.51,
"r_x1": 259.17,
"r_y1": 557.51,
"r_x2": 259.17,
"r_y2": 548.92,
"r_x3": 215.1,
"r_y3": 548.92,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.12,
"r_y0": 557.73,
"r_x1": 286.36,
"r_y1": 557.73,
"r_x2": 286.36,
"r_y2": 548.83,
"r_x3": 263.12,
"r_y3": 548.83,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 569.69,
"r_x1": 286.37,
"r_y1": 569.69,
"r_x2": 286.37,
"r_y2": 560.78,
"r_x3": 50.11,
"r_y3": 560.78,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 581.64,
"r_x1": 286.37,
"r_y1": 581.64,
"r_x2": 286.37,
"r_y2": 572.74,
"r_x3": 50.11,
"r_y3": 572.74,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 593.6,
"r_x1": 286.37,
"r_y1": 593.6,
"r_x2": 286.37,
"r_y2": 584.69,
"r_x3": 50.11,
"r_y3": 584.69,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 605.56,
"r_x1": 286.37,
"r_y1": 605.56,
"r_x2": 286.37,
"r_y2": 596.65,
"r_x3": 50.11,
"r_y3": 596.65,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 617.51,
"r_x1": 286.37,
"r_y1": 617.51,
"r_x2": 286.37,
"r_y2": 608.6,
"r_x3": 50.11,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 629.47,
"r_x1": 286.37,
"r_y1": 629.47,
"r_x2": 286.37,
"r_y2": 620.56,
"r_x3": 50.11,
"r_y3": 620.56,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 641.42,
"r_x1": 286.37,
"r_y1": 641.42,
"r_x2": 286.37,
"r_y2": 632.51,
"r_x3": 50.11,
"r_y3": 632.51,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 653.38,
"r_x1": 286.37,
"r_y1": 653.38,
"r_x2": 286.37,
"r_y2": 644.47,
"r_x3": 50.11,
"r_y3": 644.47,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 665.33,
"r_x1": 286.37,
"r_y1": 665.33,
"r_x2": 286.37,
"r_y2": 656.42,
"r_x3": 50.11,
"r_y3": 656.42,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 677.29,
"r_x1": 286.37,
"r_y1": 677.29,
"r_x2": 286.37,
"r_y2": 668.38,
"r_x3": 50.11,
"r_y3": 668.38,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 689.24,
"r_x1": 286.37,
"r_y1": 689.24,
"r_x2": 286.37,
"r_y2": 680.34,
"r_x3": 50.11,
"r_y3": 680.34,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.2,
"r_x1": 286.37,
"r_y1": 701.2,
"r_x2": 286.37,
"r_y2": 692.29,
"r_x3": 50.11,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 226.89,
"r_y1": 713.15,
"r_x2": 226.89,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."
},
{
"label": "section_header",
"id": 4,
"page_no": 7,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 490.71,
"r": 460.85,
"b": 501.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 501.46,
"r_x1": 316.07,
"r_y1": 501.46,
"r_x2": 316.07,
"r_y2": 490.71,
"r_x3": 308.86,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.69,
"r_y0": 501.46,
"r_x1": 460.85,
"r_y1": 501.46,
"r_x2": 460.85,
"r_y2": 490.71,
"r_x3": 325.69,
"r_y3": 490.71,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Future Work & Conclusion"
},
{
"label": "text",
"id": 0,
"page_no": 7,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.86,
"t": 512.89,
"r": 545.12,
"b": 653.31,
"coord_origin": "TOPLEFT"
},
"confidence": 0.988,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 521.8,
"r_x1": 545.12,
"r_y1": 521.8,
"r_x2": 545.12,
"r_y2": 512.89,
"r_x3": 320.82,
"r_y3": 512.89,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 533.75,
"r_x1": 545.12,
"r_y1": 533.75,
"r_x2": 545.12,
"r_y2": 524.85,
"r_x3": 308.86,
"r_y3": 524.85,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.71,
"r_x1": 545.12,
"r_y1": 545.71,
"r_x2": 545.12,
"r_y2": 536.8,
"r_x3": 308.86,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 557.66,
"r_x1": 545.12,
"r_y1": 557.66,
"r_x2": 545.12,
"r_y2": 548.76,
"r_x3": 308.86,
"r_y3": 548.76,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.62,
"r_x1": 545.12,
"r_y1": 569.62,
"r_x2": 545.12,
"r_y2": 560.71,
"r_x3": 308.86,
"r_y3": 560.71,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 581.57,
"r_x1": 545.12,
"r_y1": 581.57,
"r_x2": 545.12,
"r_y2": 572.67,
"r_x3": 308.86,
"r_y3": 572.67,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 593.53,
"r_x1": 545.12,
"r_y1": 593.53,
"r_x2": 545.12,
"r_y2": 584.62,
"r_x3": 308.86,
"r_y3": 584.62,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 605.49,
"r_x1": 400.47,
"r_y1": 605.49,
"r_x2": 400.47,
"r_y2": 596.58,
"r_x3": 308.86,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.38,
"r_y0": 605.49,
"r_x1": 545.12,
"r_y1": 605.49,
"r_x2": 545.12,
"r_y2": 596.58,
"r_x3": 408.38,
"r_y3": 596.58,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 617.44,
"r_x1": 545.12,
"r_y1": 617.44,
"r_x2": 545.12,
"r_y2": 608.53,
"r_x3": 308.86,
"r_y3": 608.53,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 629.4,
"r_x1": 545.12,
"r_y1": 629.4,
"r_x2": 545.12,
"r_y2": 620.49,
"r_x3": 308.86,
"r_y3": 620.49,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 641.35,
"r_x1": 545.12,
"r_y1": 641.35,
"r_x2": 545.12,
"r_y2": 632.44,
"r_x3": 308.86,
"r_y3": 632.44,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 653.31,
"r_x1": 365.86,
"r_y1": 653.31,
"r_x2": 365.86,
"r_y2": 644.4,
"r_x3": 308.86,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."
},
{
"label": "section_header",
"id": 3,
"page_no": 7,
"cluster": {
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 672.1,
"r": 364.41,
"b": 682.85,
"coord_origin": "TOPLEFT"
},
"confidence": 0.944,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 682.85,
"r_x1": 364.41,
"r_y1": 682.85,
"r_x2": 364.41,
"r_y2": 672.1,
"r_x3": 308.86,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "References"
},
{
"label": "list_item",
"id": 10,
"page_no": 7,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.35,
"t": 693.96,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.832,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.35,
"r_y0": 701.98,
"r_x1": 323.81,
"r_y1": 701.98,
"r_x2": 323.81,
"r_y2": 693.96,
"r_x3": 313.35,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.05,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 326.05,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 545.11,
"r_y1": 712.94,
"r_x2": 545.11,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"
},
{
"label": "picture",
"id": 15,
"page_no": 7,
"cluster": {
"id": 15,
"label": "picture",
"bbox": {
"l": 305.58,
"t": 98.65,
"r": 554.83,
"b": 180.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 14,
"page_no": 7,
"cluster": {
"id": 14,
"label": "picture",
"bbox": {
"l": 49.98,
"t": 103.71,
"r": 301.63,
"b": 187.58,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 9,
"page_no": 7,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.871,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8"
}
]
}
},
{
"page_no": 8,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 70.03,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 286.36,
"r_y1": 94.86,
"r_x2": 286.36,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 105.82,
"r_x1": 85.72,
"r_y1": 105.82,
"r_x2": 85.72,
"r_y2": 97.8,
"r_x3": 70.03,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.89,
"r_y0": 105.61,
"r_x1": 199.93,
"r_y1": 105.61,
"r_x2": 199.93,
"r_y2": 97.88,
"r_x3": 87.89,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.94,
"r_y0": 105.82,
"r_x1": 286.36,
"r_y1": 105.82,
"r_x2": 286.36,
"r_y2": 97.8,
"r_x3": 199.94,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 116.78,
"r_x1": 221.95,
"r_y1": 116.78,
"r_x2": 221.95,
"r_y2": 108.76,
"r_x3": 70.03,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.05,
"r_x1": 65.21,
"r_y1": 128.05,
"r_x2": 65.21,
"r_y2": 120.03,
"r_x3": 54.6,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.48,
"r_y0": 128.05,
"r_x1": 286.36,
"r_y1": 128.05,
"r_x2": 286.36,
"r_y2": 120.03,
"r_x3": 67.48,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.01,
"r_x1": 179.67,
"r_y1": 139.01,
"r_x2": 179.67,
"r_y2": 130.99,
"r_x3": 70.03,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 139.01,
"r_x1": 286.36,
"r_y1": 139.01,
"r_x2": 286.36,
"r_y2": 130.99,
"r_x3": 185.58,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.97,
"r_x1": 113.11,
"r_y1": 149.97,
"r_x2": 113.11,
"r_y2": 141.95,
"r_x3": 70.03,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.34,
"r_y0": 149.76,
"r_x1": 235.31,
"r_y1": 149.76,
"r_x2": 235.31,
"r_y2": 142.03,
"r_x3": 116.34,
"r_y3": 142.03,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.31,
"r_y0": 149.97,
"r_x1": 267.68,
"r_y1": 149.97,
"r_x2": 267.68,
"r_y2": 141.95,
"r_x3": 235.31,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.24,
"r_x1": 65.1,
"r_y1": 161.24,
"r_x2": 65.1,
"r_y2": 153.22,
"r_x3": 54.6,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.36,
"r_y0": 161.24,
"r_x1": 218.78,
"r_y1": 161.24,
"r_x2": 218.78,
"r_y2": 153.22,
"r_x3": 67.36,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.98,
"r_y0": 161.03,
"r_x1": 286.36,
"r_y1": 161.03,
"r_x2": 286.36,
"r_y2": 153.3,
"r_x3": 220.98,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 171.99,
"r_x1": 125.26,
"r_y1": 171.99,
"r_x2": 125.26,
"r_y2": 164.26,
"r_x3": 70.03,
"r_y3": 164.26,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.26,
"r_y0": 172.2,
"r_x1": 286.36,
"r_y1": 172.2,
"r_x2": 286.36,
"r_y2": 164.18,
"r_x3": 125.26,
"r_y3": 164.18,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.15,
"r_x1": 97.92,
"r_y1": 183.15,
"r_x2": 97.92,
"r_y2": 175.14,
"r_x3": 70.03,
"r_y3": 175.14,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 194.43,
"r_x1": 65.81,
"r_y1": 194.43,
"r_x2": 65.81,
"r_y2": 186.41,
"r_x3": 54.59,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.21,
"r_y0": 194.43,
"r_x1": 286.36,
"r_y1": 194.43,
"r_x2": 286.36,
"r_y2": 186.41,
"r_x3": 68.21,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.39,
"r_x1": 286.36,
"r_y1": 205.39,
"r_x2": 286.36,
"r_y2": 197.37,
"r_x3": 70.03,
"r_y3": 197.37,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 216.34,
"r_x1": 286.36,
"r_y1": 216.34,
"r_x2": 286.36,
"r_y2": 208.33,
"r_x3": 70.03,
"r_y3": 208.33,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.3,
"r_x1": 245.84,
"r_y1": 227.3,
"r_x2": 245.84,
"r_y2": 219.29,
"r_x3": 70.03,
"r_y3": 219.29,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 238.58,
"r_x1": 65.38,
"r_y1": 238.58,
"r_x2": 65.38,
"r_y2": 230.56,
"r_x3": 54.59,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 238.58,
"r_x1": 286.36,
"r_y1": 238.58,
"r_x2": 286.36,
"r_y2": 230.56,
"r_x3": 67.69,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.53,
"r_x1": 286.36,
"r_y1": 249.53,
"r_x2": 286.36,
"r_y2": 241.52,
"r_x3": 70.03,
"r_y3": 241.52,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.49,
"r_x1": 108.4,
"r_y1": 260.49,
"r_x2": 108.4,
"r_y2": 252.48,
"r_x3": 70.03,
"r_y3": 252.48,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.64,
"r_y0": 260.29,
"r_x1": 286.36,
"r_y1": 260.29,
"r_x2": 286.36,
"r_y2": 252.56,
"r_x3": 110.64,
"r_y3": 252.56,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.25,
"r_x1": 140.58,
"r_y1": 271.25,
"r_x2": 140.58,
"r_y2": 263.52,
"r_x3": 70.03,
"r_y3": 263.52,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.58,
"r_y0": 271.45,
"r_x1": 266.48,
"r_y1": 271.45,
"r_x2": 266.48,
"r_y2": 263.44,
"r_x3": 140.58,
"r_y3": 263.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 282.72,
"r_x1": 64.85,
"r_y1": 282.72,
"r_x2": 64.85,
"r_y2": 274.71,
"r_x3": 54.59,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.05,
"r_y0": 282.72,
"r_x1": 286.37,
"r_y1": 282.72,
"r_x2": 286.37,
"r_y2": 274.71,
"r_x3": 67.05,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.68,
"r_x1": 179.57,
"r_y1": 293.68,
"r_x2": 179.57,
"r_y2": 285.67,
"r_x3": 70.03,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.02,
"r_y0": 293.68,
"r_x1": 194.48,
"r_y1": 293.68,
"r_x2": 194.48,
"r_y2": 285.67,
"r_x3": 187.02,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.04,
"r_y0": 293.48,
"r_x1": 286.36,
"r_y1": 293.48,
"r_x2": 286.36,
"r_y2": 285.75,
"r_x3": 198.04,
"r_y3": 285.75,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.44,
"r_x1": 260.2,
"r_y1": 304.44,
"r_x2": 260.2,
"r_y2": 296.71,
"r_x3": 70.03,
"r_y3": 296.71,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.64,
"r_x1": 286.36,
"r_y1": 304.64,
"r_x2": 286.36,
"r_y2": 296.63,
"r_x3": 260.2,
"r_y3": 296.63,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.6,
"r_x1": 142.75,
"r_y1": 315.6,
"r_x2": 142.75,
"r_y2": 307.58,
"r_x3": 70.03,
"r_y3": 307.58,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 326.87,
"r_x1": 65.62,
"r_y1": 326.87,
"r_x2": 65.62,
"r_y2": 318.86,
"r_x3": 54.59,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 326.87,
"r_x1": 199.49,
"r_y1": 326.87,
"r_x2": 199.49,
"r_y2": 318.86,
"r_x3": 67.98,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.99,
"r_y0": 326.87,
"r_x1": 286.36,
"r_y1": 326.87,
"r_x2": 286.36,
"r_y2": 318.86,
"r_x3": 206.99,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 337.83,
"r_x1": 176.28,
"r_y1": 337.83,
"r_x2": 176.28,
"r_y2": 329.81,
"r_x3": 70.03,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.83,
"r_x1": 190.07,
"r_y1": 337.83,
"r_x2": 190.07,
"r_y2": 329.81,
"r_x3": 182.6,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.28,
"r_y0": 337.62,
"r_x1": 286.36,
"r_y1": 337.62,
"r_x2": 286.36,
"r_y2": 329.9,
"r_x3": 193.28,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.58,
"r_x1": 206.35,
"r_y1": 348.58,
"r_x2": 206.35,
"r_y2": 340.85,
"r_x3": 70.03,
"r_y3": 340.85,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.35,
"r_y0": 348.79,
"r_x1": 274.82,
"r_y1": 348.79,
"r_x2": 274.82,
"r_y2": 340.77,
"r_x3": 206.35,
"r_y3": 340.77,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 360.06,
"r_x1": 65.05,
"r_y1": 360.06,
"r_x2": 65.05,
"r_y2": 352.05,
"r_x3": 54.59,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.29,
"r_y0": 360.06,
"r_x1": 286.36,
"r_y1": 360.06,
"r_x2": 286.36,
"r_y2": 352.05,
"r_x3": 67.29,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 371.02,
"r_x1": 234.13,
"r_y1": 371.02,
"r_x2": 234.13,
"r_y2": 363.0,
"r_x3": 70.03,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.05,
"r_y0": 371.02,
"r_x1": 286.36,
"r_y1": 371.02,
"r_x2": 286.36,
"r_y2": 363.0,
"r_x3": 240.05,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.98,
"r_x1": 286.36,
"r_y1": 381.98,
"r_x2": 286.36,
"r_y2": 373.96,
"r_x3": 70.03,
"r_y3": 373.96,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 70.03,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 114.58,
"r_y1": 403.9,
"r_x2": 114.58,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.69,
"r_x1": 186.73,
"r_y1": 403.69,
"r_x2": 186.73,
"r_y2": 395.96,
"r_x3": 117.8,
"r_y3": 395.96,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.73,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.88,
"r_x3": 186.73,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.17,
"r_x1": 65.33,
"r_y1": 415.17,
"r_x2": 65.33,
"r_y2": 407.15,
"r_x3": 54.6,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.64,
"r_y0": 415.17,
"r_x1": 286.36,
"r_y1": 415.17,
"r_x2": 286.36,
"r_y2": 407.15,
"r_x3": 67.64,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 426.13,
"r_x1": 147.13,
"r_y1": 426.13,
"r_x2": 147.13,
"r_y2": 418.11,
"r_x3": 70.03,
"r_y3": 418.11,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.16,
"r_y0": 425.92,
"r_x1": 286.36,
"r_y1": 425.92,
"r_x2": 286.36,
"r_y2": 418.19,
"r_x3": 149.16,
"r_y3": 418.19,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.88,
"r_x1": 213.48,
"r_y1": 436.88,
"r_x2": 213.48,
"r_y2": 429.15,
"r_x3": 70.03,
"r_y3": 429.15,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.48,
"r_y0": 437.09,
"r_x1": 261.04,
"r_y1": 437.09,
"r_x2": 261.04,
"r_y2": 429.07,
"r_x3": 213.48,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.36,
"r_x1": 65.4,
"r_y1": 448.36,
"r_x2": 65.4,
"r_y2": 440.34,
"r_x3": 50.11,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 448.36,
"r_x1": 286.36,
"r_y1": 448.36,
"r_x2": 286.36,
"r_y2": 440.34,
"r_x3": 67.69,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 459.32,
"r_x1": 202.74,
"r_y1": 459.32,
"r_x2": 202.74,
"r_y2": 451.3,
"r_x3": 70.03,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.32,
"r_x1": 286.36,
"r_y1": 459.32,
"r_x2": 286.36,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 470.28,
"r_x1": 286.36,
"r_y1": 470.28,
"r_x2": 286.36,
"r_y2": 462.26,
"r_x3": 70.03,
"r_y3": 462.26,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 481.24,
"r_x1": 141.87,
"r_y1": 481.24,
"r_x2": 141.87,
"r_y2": 473.22,
"r_x3": 70.03,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.03,
"r_x1": 166.02,
"r_y1": 481.03,
"r_x2": 166.02,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.01,
"r_y0": 481.24,
"r_x1": 259.9,
"r_y1": 481.24,
"r_x2": 259.9,
"r_y2": 473.22,
"r_x3": 166.01,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.51,
"r_x1": 66.03,
"r_y1": 492.51,
"r_x2": 66.03,
"r_y2": 484.49,
"r_x3": 50.11,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.42,
"r_y0": 492.51,
"r_x1": 286.36,
"r_y1": 492.51,
"r_x2": 286.36,
"r_y2": 484.49,
"r_x3": 68.42,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 503.47,
"r_x1": 286.36,
"r_y1": 503.47,
"r_x2": 286.36,
"r_y2": 495.45,
"r_x3": 70.03,
"r_y3": 495.45,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 514.22,
"r_x1": 227.41,
"r_y1": 514.22,
"r_x2": 227.41,
"r_y2": 506.49,
"r_x3": 70.03,
"r_y3": 506.49,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.41,
"r_y0": 514.42,
"r_x1": 286.36,
"r_y1": 514.42,
"r_x2": 286.36,
"r_y2": 506.41,
"r_x3": 227.41,
"r_y3": 506.41,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.38,
"r_x1": 286.36,
"r_y1": 525.38,
"r_x2": 286.36,
"r_y2": 517.37,
"r_x3": 70.03,
"r_y3": 517.37,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 536.34,
"r_x1": 112.36,
"r_y1": 536.34,
"r_x2": 112.36,
"r_y2": 528.33,
"r_x3": 70.03,
"r_y3": 528.33,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 547.61,
"r_x1": 65.47,
"r_y1": 547.61,
"r_x2": 65.47,
"r_y2": 539.6,
"r_x3": 50.11,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 547.61,
"r_x1": 286.36,
"r_y1": 547.61,
"r_x2": 286.36,
"r_y2": 539.6,
"r_x3": 67.77,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 558.57,
"r_x1": 136.28,
"r_y1": 558.57,
"r_x2": 136.28,
"r_y2": 550.56,
"r_x3": 70.03,
"r_y3": 550.56,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.81,
"r_y0": 558.37,
"r_x1": 286.36,
"r_y1": 558.37,
"r_x2": 286.36,
"r_y2": 550.64,
"r_x3": 138.81,
"r_y3": 550.64,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.33,
"r_x1": 286.36,
"r_y1": 569.33,
"r_x2": 286.36,
"r_y2": 561.6,
"r_x3": 70.03,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.29,
"r_x1": 74.51,
"r_y1": 580.29,
"r_x2": 74.51,
"r_y2": 572.56,
"r_x3": 70.03,
"r_y3": 572.56,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.51,
"r_y0": 580.49,
"r_x1": 286.36,
"r_y1": 580.49,
"r_x2": 286.36,
"r_y2": 572.48,
"r_x3": 74.51,
"r_y3": 572.48,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.45,
"r_x1": 90.36,
"r_y1": 591.45,
"r_x2": 90.36,
"r_y2": 583.43,
"r_x3": 70.03,
"r_y3": 583.43,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.72,
"r_x1": 66.27,
"r_y1": 602.72,
"r_x2": 66.27,
"r_y2": 594.71,
"r_x3": 50.11,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.72,
"r_x1": 286.36,
"r_y1": 602.72,
"r_x2": 286.36,
"r_y2": 594.71,
"r_x3": 68.7,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.68,
"r_x1": 286.36,
"r_y1": 613.68,
"r_x2": 286.36,
"r_y2": 605.66,
"r_x3": 70.03,
"r_y3": 605.66,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.64,
"r_x1": 286.36,
"r_y1": 624.64,
"r_x2": 286.36,
"r_y2": 616.62,
"r_x3": 70.03,
"r_y3": 616.62,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.58,
"r_x3": 70.03,
"r_y3": 627.58,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.92,
"r_y0": 635.39,
"r_x1": 286.36,
"r_y1": 635.39,
"r_x2": 286.36,
"r_y2": 627.66,
"r_x3": 79.92,
"r_y3": 627.66,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 646.35,
"r_x1": 140.68,
"r_y1": 646.35,
"r_x2": 140.68,
"r_y2": 638.62,
"r_x3": 70.03,
"r_y3": 638.62,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.68,
"r_y0": 646.56,
"r_x1": 264.44,
"r_y1": 646.56,
"r_x2": 264.44,
"r_y2": 638.54,
"r_x3": 140.68,
"r_y3": 638.54,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 657.83,
"r_x1": 66.53,
"r_y1": 657.83,
"r_x2": 66.53,
"r_y2": 649.81,
"r_x3": 50.11,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.83,
"r_x1": 286.36,
"r_y1": 657.83,
"r_x2": 286.36,
"r_y2": 649.81,
"r_x3": 69.0,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.79,
"r_x1": 93.2,
"r_y1": 668.79,
"r_x2": 93.2,
"r_y2": 660.77,
"r_x3": 70.03,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.79,
"r_x1": 286.36,
"r_y1": 668.79,
"r_x2": 286.36,
"r_y2": 660.77,
"r_x3": 102.2,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.75,
"r_x1": 172.0,
"r_y1": 679.75,
"r_x2": 172.0,
"r_y2": 671.73,
"r_x3": 70.03,
"r_y3": 671.73,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 691.02,
"r_x1": 65.52,
"r_y1": 691.02,
"r_x2": 65.52,
"r_y2": 683.0,
"r_x3": 50.11,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.83,
"r_y0": 691.02,
"r_x1": 286.36,
"r_y1": 691.02,
"r_x2": 286.36,
"r_y2": 683.0,
"r_x3": 67.83,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 701.98,
"r_x1": 102.16,
"r_y1": 701.98,
"r_x2": 102.16,
"r_y2": 693.96,
"r_x3": 70.03,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.55,
"r_y0": 701.77,
"r_x1": 231.47,
"r_y1": 701.77,
"r_x2": 231.47,
"r_y2": 694.04,
"r_x3": 107.55,
"r_y3": 694.04,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.48,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 231.48,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 97.92,
"r_y1": 712.94,
"r_x2": 97.92,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 83.9,
"r_x1": 324.75,
"r_y1": 83.9,
"r_x2": 324.75,
"r_y2": 75.88,
"r_x3": 308.86,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.13,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 327.13,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 545.11,
"r_y1": 94.86,
"r_x2": 545.11,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.82,
"r_x1": 390.96,
"r_y1": 105.82,
"r_x2": 390.96,
"r_y2": 97.8,
"r_x3": 328.78,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.27,
"r_y0": 105.82,
"r_x1": 435.14,
"r_y1": 105.82,
"r_x2": 435.14,
"r_y2": 97.8,
"r_x3": 400.27,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.71,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 441.71,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 440.81,
"r_y1": 116.78,
"r_x2": 440.81,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.63,
"r_y0": 116.57,
"r_x1": 545.11,
"r_y1": 116.57,
"r_x2": 545.11,
"r_y2": 108.84,
"r_x3": 446.63,
"r_y3": 108.84,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 127.53,
"r_x1": 471.13,
"r_y1": 127.53,
"r_x2": 471.13,
"r_y2": 119.8,
"r_x3": 328.78,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.13,
"r_y0": 127.73,
"r_x1": 545.11,
"r_y1": 127.73,
"r_x2": 545.11,
"r_y2": 119.72,
"r_x3": 471.13,
"r_y3": 119.72,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 138.69,
"r_x1": 356.67,
"r_y1": 138.69,
"r_x2": 356.67,
"r_y2": 130.68,
"r_x3": 328.78,
"r_y3": 130.68,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 150.14,
"r_x1": 325.24,
"r_y1": 150.14,
"r_x2": 325.24,
"r_y2": 142.12,
"r_x3": 308.86,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.14,
"r_x1": 545.11,
"r_y1": 150.14,
"r_x2": 545.11,
"r_y2": 142.12,
"r_x3": 327.7,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.1,
"r_x1": 414.45,
"r_y1": 161.1,
"r_x2": 414.45,
"r_y2": 153.08,
"r_x3": 328.78,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.83,
"r_y0": 161.1,
"r_x1": 545.11,
"r_y1": 161.1,
"r_x2": 545.11,
"r_y2": 153.08,
"r_x3": 421.83,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 172.06,
"r_x1": 493.63,
"r_y1": 172.06,
"r_x2": 493.63,
"r_y2": 164.04,
"r_x3": 328.78,
"r_y3": 164.04,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.5,
"r_x1": 324.27,
"r_y1": 183.5,
"r_x2": 324.27,
"r_y2": 175.49,
"r_x3": 308.86,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 183.5,
"r_x1": 545.11,
"r_y1": 183.5,
"r_x2": 545.11,
"r_y2": 175.49,
"r_x3": 326.58,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 194.46,
"r_x1": 545.11,
"r_y1": 194.46,
"r_x2": 545.11,
"r_y2": 186.45,
"r_x3": 328.78,
"r_y3": 186.45,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 205.42,
"r_x1": 545.11,
"r_y1": 205.42,
"r_x2": 545.11,
"r_y2": 197.4,
"r_x3": 328.78,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 216.38,
"r_x1": 545.11,
"r_y1": 216.38,
"r_x2": 545.11,
"r_y2": 208.36,
"r_x3": 328.78,
"r_y3": 208.36,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 227.34,
"r_x1": 479.26,
"r_y1": 227.34,
"r_x2": 479.26,
"r_y2": 219.32,
"r_x3": 328.78,
"r_y3": 219.32,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 227.13,
"r_x1": 545.11,
"r_y1": 227.13,
"r_x2": 545.11,
"r_y2": 219.4,
"r_x3": 483.12,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 238.09,
"r_x1": 519.4,
"r_y1": 238.09,
"r_x2": 519.4,
"r_y2": 230.36,
"r_x3": 328.78,
"r_y3": 230.36,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.11,
"r_y1": 238.3,
"r_x2": 545.11,
"r_y2": 230.28,
"r_x3": 519.4,
"r_y3": 230.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 249.26,
"r_x1": 545.11,
"r_y1": 249.26,
"r_x2": 545.11,
"r_y2": 241.24,
"r_x3": 328.78,
"r_y3": 241.24,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 260.21,
"r_x1": 333.26,
"r_y1": 260.21,
"r_x2": 333.26,
"r_y2": 252.2,
"r_x3": 328.78,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 271.66,
"r_x1": 324.26,
"r_y1": 271.66,
"r_x2": 324.26,
"r_y2": 263.64,
"r_x3": 308.86,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 271.66,
"r_x1": 545.11,
"r_y1": 271.66,
"r_x2": 545.11,
"r_y2": 263.64,
"r_x3": 326.58,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 282.62,
"r_x1": 545.11,
"r_y1": 282.62,
"r_x2": 545.11,
"r_y2": 274.6,
"r_x3": 328.78,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 293.58,
"r_x1": 545.11,
"r_y1": 293.58,
"r_x2": 545.11,
"r_y2": 285.56,
"r_x3": 328.78,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 304.54,
"r_x1": 545.11,
"r_y1": 304.54,
"r_x2": 545.11,
"r_y2": 296.52,
"r_x3": 328.78,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 315.5,
"r_x1": 352.85,
"r_y1": 315.5,
"r_x2": 352.85,
"r_y2": 307.48,
"r_x3": 328.78,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.24,
"r_y0": 315.29,
"r_x1": 545.11,
"r_y1": 315.29,
"r_x2": 545.11,
"r_y2": 307.56,
"r_x3": 360.24,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 326.25,
"r_x1": 371.02,
"r_y1": 326.25,
"r_x2": 371.02,
"r_y2": 318.52,
"r_x3": 328.78,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.02,
"r_y0": 326.45,
"r_x1": 502.26,
"r_y1": 326.45,
"r_x2": 502.26,
"r_y2": 318.44,
"r_x3": 371.02,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.9,
"r_x1": 323.83,
"r_y1": 337.9,
"r_x2": 323.83,
"r_y2": 329.88,
"r_x3": 308.86,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.07,
"r_y0": 337.9,
"r_x1": 545.11,
"r_y1": 337.9,
"r_x2": 545.11,
"r_y2": 329.88,
"r_x3": 326.07,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 348.86,
"r_x1": 545.11,
"r_y1": 348.86,
"r_x2": 545.11,
"r_y2": 340.84,
"r_x3": 328.78,
"r_y3": 340.84,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 359.82,
"r_x1": 382.78,
"r_y1": 359.82,
"r_x2": 382.78,
"r_y2": 351.8,
"r_x3": 328.78,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.54,
"r_y0": 359.61,
"r_x1": 545.12,
"r_y1": 359.61,
"r_x2": 545.12,
"r_y2": 351.88,
"r_x3": 385.54,
"r_y3": 351.88,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 370.57,
"r_x1": 443.6,
"r_y1": 370.57,
"r_x2": 443.6,
"r_y2": 362.84,
"r_x3": 328.78,
"r_y3": 362.84,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.59,
"r_y0": 370.78,
"r_x1": 534.49,
"r_y1": 370.78,
"r_x2": 534.49,
"r_y2": 362.76,
"r_x3": 443.59,
"r_y3": 362.76,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 382.22,
"r_x1": 324.6,
"r_y1": 382.22,
"r_x2": 324.6,
"r_y2": 374.21,
"r_x3": 308.86,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.96,
"r_y0": 382.22,
"r_x1": 362.66,
"r_y1": 382.22,
"r_x2": 362.66,
"r_y2": 374.21,
"r_x3": 326.96,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.69,
"r_y0": 382.22,
"r_x1": 389.61,
"r_y1": 382.22,
"r_x2": 389.61,
"r_y2": 374.21,
"r_x3": 368.69,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.65,
"r_y0": 382.22,
"r_x1": 424.56,
"r_y1": 382.22,
"r_x2": 424.56,
"r_y2": 374.21,
"r_x3": 395.65,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.55,
"r_y0": 382.22,
"r_x1": 438.02,
"r_y1": 382.22,
"r_x2": 438.02,
"r_y2": 374.21,
"r_x3": 431.55,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.06,
"r_y0": 382.22,
"r_x1": 488.5,
"r_y1": 382.22,
"r_x2": 488.5,
"r_y2": 374.21,
"r_x3": 444.06,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.48,
"r_y0": 382.22,
"r_x1": 515.41,
"r_y1": 382.22,
"r_x2": 515.41,
"r_y2": 374.21,
"r_x3": 495.48,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.45,
"r_y0": 382.22,
"r_x1": 545.11,
"r_y1": 382.22,
"r_x2": 545.11,
"r_y2": 374.21,
"r_x3": 521.45,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 393.18,
"r_x1": 545.11,
"r_y1": 393.18,
"r_x2": 545.11,
"r_y2": 385.17,
"r_x3": 328.78,
"r_y3": 385.17,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 404.14,
"r_x1": 545.11,
"r_y1": 404.14,
"r_x2": 545.11,
"r_y2": 396.12,
"r_x3": 328.78,
"r_y3": 396.12,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 415.1,
"r_x1": 478.01,
"r_y1": 415.1,
"r_x2": 478.01,
"r_y2": 407.08,
"r_x3": 328.78,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.07,
"r_y0": 415.1,
"r_x1": 491.54,
"r_y1": 415.1,
"r_x2": 491.54,
"r_y2": 407.08,
"r_x3": 484.07,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.67,
"r_y0": 414.89,
"r_x1": 545.11,
"r_y1": 414.89,
"r_x2": 545.11,
"r_y2": 407.16,
"r_x3": 494.67,
"r_y3": 407.16,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 425.85,
"r_x1": 545.11,
"r_y1": 425.85,
"r_x2": 545.11,
"r_y2": 418.12,
"r_x3": 328.78,
"r_y3": 418.12,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 436.81,
"r_x1": 360.84,
"r_y1": 436.81,
"r_x2": 360.84,
"r_y2": 429.08,
"r_x3": 328.78,
"r_y3": 429.08,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.84,
"r_y0": 437.02,
"r_x1": 475.63,
"r_y1": 437.02,
"r_x2": 475.63,
"r_y2": 429.0,
"r_x3": 360.84,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.46,
"r_x1": 324.57,
"r_y1": 448.46,
"r_x2": 324.57,
"r_y2": 440.45,
"r_x3": 308.86,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.93,
"r_y0": 448.46,
"r_x1": 545.11,
"r_y1": 448.46,
"r_x2": 545.11,
"r_y2": 440.45,
"r_x3": 326.93,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 459.42,
"r_x1": 545.11,
"r_y1": 459.42,
"r_x2": 545.11,
"r_y2": 451.41,
"r_x3": 328.78,
"r_y3": 451.41,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 470.38,
"r_x1": 545.11,
"r_y1": 470.38,
"r_x2": 545.11,
"r_y2": 462.36,
"r_x3": 328.78,
"r_y3": 462.36,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 481.34,
"r_x1": 545.11,
"r_y1": 481.34,
"r_x2": 545.11,
"r_y2": 473.32,
"r_x3": 328.78,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 492.3,
"r_x1": 545.11,
"r_y1": 492.3,
"r_x2": 545.11,
"r_y2": 484.28,
"r_x3": 328.78,
"r_y3": 484.28,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 503.26,
"r_x1": 545.11,
"r_y1": 503.26,
"r_x2": 545.11,
"r_y2": 495.24,
"r_x3": 328.78,
"r_y3": 495.24,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 514.22,
"r_x1": 545.11,
"r_y1": 514.22,
"r_x2": 545.11,
"r_y2": 506.2,
"r_x3": 328.78,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 525.17,
"r_x1": 545.11,
"r_y1": 525.17,
"r_x2": 545.11,
"r_y2": 517.16,
"r_x3": 328.78,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 536.13,
"r_x1": 434.57,
"r_y1": 536.13,
"r_x2": 434.57,
"r_y2": 528.12,
"r_x3": 328.78,
"r_y3": 528.12,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.86,
"r_y0": 535.93,
"r_x1": 545.11,
"r_y1": 535.93,
"r_x2": 545.11,
"r_y2": 528.2,
"r_x3": 437.86,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 546.89,
"r_x1": 425.73,
"r_y1": 546.89,
"r_x2": 425.73,
"r_y2": 539.16,
"r_x3": 328.78,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.74,
"r_y0": 547.09,
"r_x1": 545.11,
"r_y1": 547.09,
"r_x2": 545.11,
"r_y2": 539.08,
"r_x3": 425.74,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 558.05,
"r_x1": 399.74,
"r_y1": 558.05,
"r_x2": 399.74,
"r_y2": 550.03,
"r_x3": 328.78,
"r_y3": 550.03,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.48,
"r_x3": 308.86,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.85,
"r_y0": 569.5,
"r_x1": 545.11,
"r_y1": 569.5,
"r_x2": 545.11,
"r_y2": 561.48,
"r_x3": 326.85,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 580.46,
"r_x1": 545.11,
"r_y1": 580.46,
"r_x2": 545.11,
"r_y2": 572.44,
"r_x3": 328.78,
"r_y3": 572.44,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 591.41,
"r_x1": 545.11,
"r_y1": 591.41,
"r_x2": 545.11,
"r_y2": 583.4,
"r_x3": 328.78,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 602.37,
"r_x1": 431.62,
"r_y1": 602.37,
"r_x2": 431.62,
"r_y2": 594.36,
"r_x3": 328.78,
"r_y3": 594.36,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.69,
"r_y0": 602.17,
"r_x1": 545.11,
"r_y1": 602.17,
"r_x2": 545.11,
"r_y2": 594.44,
"r_x3": 434.69,
"r_y3": 594.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 613.13,
"r_x1": 545.11,
"r_y1": 613.13,
"r_x2": 545.11,
"r_y2": 605.4,
"r_x3": 328.78,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 624.08,
"r_x1": 367.8,
"r_y1": 624.08,
"r_x2": 367.8,
"r_y2": 616.36,
"r_x3": 328.78,
"r_y3": 616.36,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.29,
"r_x1": 458.69,
"r_y1": 624.29,
"r_x2": 458.69,
"r_y2": 616.28,
"r_x3": 367.8,
"r_y3": 616.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 635.74,
"r_x1": 324.69,
"r_y1": 635.74,
"r_x2": 324.69,
"r_y2": 627.72,
"r_x3": 308.86,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.07,
"r_y0": 635.74,
"r_x1": 545.11,
"r_y1": 635.74,
"r_x2": 545.11,
"r_y2": 627.72,
"r_x3": 327.07,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 646.7,
"r_x1": 545.11,
"r_y1": 646.7,
"r_x2": 545.11,
"r_y2": 638.68,
"r_x3": 328.78,
"r_y3": 638.68,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 657.65,
"r_x1": 336.25,
"r_y1": 657.65,
"r_x2": 336.25,
"r_y2": 649.64,
"r_x3": 328.78,
"r_y3": 649.64,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.45,
"r_x1": 545.12,
"r_y1": 657.45,
"r_x2": 545.12,
"r_y2": 649.72,
"r_x3": 338.1,
"r_y3": 649.72,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 668.41,
"r_x1": 406.32,
"r_y1": 668.41,
"r_x2": 406.32,
"r_y2": 660.68,
"r_x3": 328.78,
"r_y3": 660.68,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 668.61,
"r_x1": 521.12,
"r_y1": 668.61,
"r_x2": 521.12,
"r_y2": 660.6,
"r_x3": 406.32,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 680.06,
"r_x1": 324.71,
"r_y1": 680.06,
"r_x2": 324.71,
"r_y2": 672.04,
"r_x3": 308.86,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.09,
"r_y0": 680.06,
"r_x1": 545.11,
"r_y1": 680.06,
"r_x2": 545.11,
"r_y2": 672.04,
"r_x3": 327.09,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 691.02,
"r_x1": 482.81,
"r_y1": 691.02,
"r_x2": 482.81,
"r_y2": 683.0,
"r_x3": 328.78,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.75,
"r_y0": 691.02,
"r_x1": 545.11,
"r_y1": 691.02,
"r_x2": 545.11,
"r_y2": 683.0,
"r_x3": 488.75,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 328.78,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 379.15,
"r_y1": 712.94,
"r_x2": 379.15,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.62,
"r_y0": 712.73,
"r_x1": 545.11,
"r_y1": 712.73,
"r_x2": 545.11,
"r_y2": 705.0,
"r_x3": 381.62,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.731,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 70.03,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 286.36,
"r_y1": 94.86,
"r_x2": 286.36,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 105.82,
"r_x1": 85.72,
"r_y1": 105.82,
"r_x2": 85.72,
"r_y2": 97.8,
"r_x3": 70.03,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.89,
"r_y0": 105.61,
"r_x1": 199.93,
"r_y1": 105.61,
"r_x2": 199.93,
"r_y2": 97.88,
"r_x3": 87.89,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.94,
"r_y0": 105.82,
"r_x1": 286.36,
"r_y1": 105.82,
"r_x2": 286.36,
"r_y2": 97.8,
"r_x3": 199.94,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 116.78,
"r_x1": 221.95,
"r_y1": 116.78,
"r_x2": 221.95,
"r_y2": 108.76,
"r_x3": 70.03,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.03,
"r": 286.36,
"b": 149.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.05,
"r_x1": 65.21,
"r_y1": 128.05,
"r_x2": 65.21,
"r_y2": 120.03,
"r_x3": 54.6,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.48,
"r_y0": 128.05,
"r_x1": 286.36,
"r_y1": 128.05,
"r_x2": 286.36,
"r_y2": 120.03,
"r_x3": 67.48,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.01,
"r_x1": 179.67,
"r_y1": 139.01,
"r_x2": 179.67,
"r_y2": 130.99,
"r_x3": 70.03,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 139.01,
"r_x1": 286.36,
"r_y1": 139.01,
"r_x2": 286.36,
"r_y2": 130.99,
"r_x3": 185.58,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.97,
"r_x1": 113.11,
"r_y1": 149.97,
"r_x2": 113.11,
"r_y2": 141.95,
"r_x3": 70.03,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.34,
"r_y0": 149.76,
"r_x1": 235.31,
"r_y1": 149.76,
"r_x2": 235.31,
"r_y2": 142.03,
"r_x3": 116.34,
"r_y3": 142.03,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.31,
"r_y0": 149.97,
"r_x1": 267.68,
"r_y1": 149.97,
"r_x2": 267.68,
"r_y2": 141.95,
"r_x3": 235.31,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.22,
"r": 286.36,
"b": 183.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.24,
"r_x1": 65.1,
"r_y1": 161.24,
"r_x2": 65.1,
"r_y2": 153.22,
"r_x3": 54.6,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.36,
"r_y0": 161.24,
"r_x1": 218.78,
"r_y1": 161.24,
"r_x2": 218.78,
"r_y2": 153.22,
"r_x3": 67.36,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.98,
"r_y0": 161.03,
"r_x1": 286.36,
"r_y1": 161.03,
"r_x2": 286.36,
"r_y2": 153.3,
"r_x3": 220.98,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 171.99,
"r_x1": 125.26,
"r_y1": 171.99,
"r_x2": 125.26,
"r_y2": 164.26,
"r_x3": 70.03,
"r_y3": 164.26,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.26,
"r_y0": 172.2,
"r_x1": 286.36,
"r_y1": 172.2,
"r_x2": 286.36,
"r_y2": 164.18,
"r_x3": 125.26,
"r_y3": 164.18,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.15,
"r_x1": 97.92,
"r_y1": 183.15,
"r_x2": 97.92,
"r_y2": 175.14,
"r_x3": 70.03,
"r_y3": 175.14,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 186.41,
"r": 286.36,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 194.43,
"r_x1": 65.81,
"r_y1": 194.43,
"r_x2": 65.81,
"r_y2": 186.41,
"r_x3": 54.59,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.21,
"r_y0": 194.43,
"r_x1": 286.36,
"r_y1": 194.43,
"r_x2": 286.36,
"r_y2": 186.41,
"r_x3": 68.21,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.39,
"r_x1": 286.36,
"r_y1": 205.39,
"r_x2": 286.36,
"r_y2": 197.37,
"r_x3": 70.03,
"r_y3": 197.37,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 216.34,
"r_x1": 286.36,
"r_y1": 216.34,
"r_x2": 286.36,
"r_y2": 208.33,
"r_x3": 70.03,
"r_y3": 208.33,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.3,
"r_x1": 245.84,
"r_y1": 227.3,
"r_x2": 245.84,
"r_y2": 219.29,
"r_x3": 70.03,
"r_y3": 219.29,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 230.56,
"r": 286.36,
"b": 271.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 238.58,
"r_x1": 65.38,
"r_y1": 238.58,
"r_x2": 65.38,
"r_y2": 230.56,
"r_x3": 54.59,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 238.58,
"r_x1": 286.36,
"r_y1": 238.58,
"r_x2": 286.36,
"r_y2": 230.56,
"r_x3": 67.69,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.53,
"r_x1": 286.36,
"r_y1": 249.53,
"r_x2": 286.36,
"r_y2": 241.52,
"r_x3": 70.03,
"r_y3": 241.52,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.49,
"r_x1": 108.4,
"r_y1": 260.49,
"r_x2": 108.4,
"r_y2": 252.48,
"r_x3": 70.03,
"r_y3": 252.48,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.64,
"r_y0": 260.29,
"r_x1": 286.36,
"r_y1": 260.29,
"r_x2": 286.36,
"r_y2": 252.56,
"r_x3": 110.64,
"r_y3": 252.56,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.25,
"r_x1": 140.58,
"r_y1": 271.25,
"r_x2": 140.58,
"r_y2": 263.52,
"r_x3": 70.03,
"r_y3": 263.52,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.58,
"r_y0": 271.45,
"r_x1": 266.48,
"r_y1": 271.45,
"r_x2": 266.48,
"r_y2": 263.44,
"r_x3": 140.58,
"r_y3": 263.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 274.71,
"r": 286.37,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 282.72,
"r_x1": 64.85,
"r_y1": 282.72,
"r_x2": 64.85,
"r_y2": 274.71,
"r_x3": 54.59,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.05,
"r_y0": 282.72,
"r_x1": 286.37,
"r_y1": 282.72,
"r_x2": 286.37,
"r_y2": 274.71,
"r_x3": 67.05,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.68,
"r_x1": 179.57,
"r_y1": 293.68,
"r_x2": 179.57,
"r_y2": 285.67,
"r_x3": 70.03,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.02,
"r_y0": 293.68,
"r_x1": 194.48,
"r_y1": 293.68,
"r_x2": 194.48,
"r_y2": 285.67,
"r_x3": 187.02,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.04,
"r_y0": 293.48,
"r_x1": 286.36,
"r_y1": 293.48,
"r_x2": 286.36,
"r_y2": 285.75,
"r_x3": 198.04,
"r_y3": 285.75,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.44,
"r_x1": 260.2,
"r_y1": 304.44,
"r_x2": 260.2,
"r_y2": 296.71,
"r_x3": 70.03,
"r_y3": 296.71,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.64,
"r_x1": 286.36,
"r_y1": 304.64,
"r_x2": 286.36,
"r_y2": 296.63,
"r_x3": 260.2,
"r_y3": 296.63,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.6,
"r_x1": 142.75,
"r_y1": 315.6,
"r_x2": 142.75,
"r_y2": 307.58,
"r_x3": 70.03,
"r_y3": 307.58,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 318.86,
"r": 286.36,
"b": 348.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 326.87,
"r_x1": 65.62,
"r_y1": 326.87,
"r_x2": 65.62,
"r_y2": 318.86,
"r_x3": 54.59,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 326.87,
"r_x1": 199.49,
"r_y1": 326.87,
"r_x2": 199.49,
"r_y2": 318.86,
"r_x3": 67.98,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.99,
"r_y0": 326.87,
"r_x1": 286.36,
"r_y1": 326.87,
"r_x2": 286.36,
"r_y2": 318.86,
"r_x3": 206.99,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 337.83,
"r_x1": 176.28,
"r_y1": 337.83,
"r_x2": 176.28,
"r_y2": 329.81,
"r_x3": 70.03,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.83,
"r_x1": 190.07,
"r_y1": 337.83,
"r_x2": 190.07,
"r_y2": 329.81,
"r_x3": 182.6,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.28,
"r_y0": 337.62,
"r_x1": 286.36,
"r_y1": 337.62,
"r_x2": 286.36,
"r_y2": 329.9,
"r_x3": 193.28,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.58,
"r_x1": 206.35,
"r_y1": 348.58,
"r_x2": 206.35,
"r_y2": 340.85,
"r_x3": 70.03,
"r_y3": 340.85,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.35,
"r_y0": 348.79,
"r_x1": 274.82,
"r_y1": 348.79,
"r_x2": 274.82,
"r_y2": 340.77,
"r_x3": 206.35,
"r_y3": 340.77,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 352.05,
"r": 286.36,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 360.06,
"r_x1": 65.05,
"r_y1": 360.06,
"r_x2": 65.05,
"r_y2": 352.05,
"r_x3": 54.59,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.29,
"r_y0": 360.06,
"r_x1": 286.36,
"r_y1": 360.06,
"r_x2": 286.36,
"r_y2": 352.05,
"r_x3": 67.29,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 371.02,
"r_x1": 234.13,
"r_y1": 371.02,
"r_x2": 234.13,
"r_y2": 363.0,
"r_x3": 70.03,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.05,
"r_y0": 371.02,
"r_x1": 286.36,
"r_y1": 371.02,
"r_x2": 286.36,
"r_y2": 363.0,
"r_x3": 240.05,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.98,
"r_x1": 286.36,
"r_y1": 381.98,
"r_x2": 286.36,
"r_y2": 373.96,
"r_x3": 70.03,
"r_y3": 373.96,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 70.03,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 114.58,
"r_y1": 403.9,
"r_x2": 114.58,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.69,
"r_x1": 186.73,
"r_y1": 403.69,
"r_x2": 186.73,
"r_y2": 395.96,
"r_x3": 117.8,
"r_y3": 395.96,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.73,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.88,
"r_x3": 186.73,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.15,
"r": 286.36,
"b": 437.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.933,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.17,
"r_x1": 65.33,
"r_y1": 415.17,
"r_x2": 65.33,
"r_y2": 407.15,
"r_x3": 54.6,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.64,
"r_y0": 415.17,
"r_x1": 286.36,
"r_y1": 415.17,
"r_x2": 286.36,
"r_y2": 407.15,
"r_x3": 67.64,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 426.13,
"r_x1": 147.13,
"r_y1": 426.13,
"r_x2": 147.13,
"r_y2": 418.11,
"r_x3": 70.03,
"r_y3": 418.11,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.16,
"r_y0": 425.92,
"r_x1": 286.36,
"r_y1": 425.92,
"r_x2": 286.36,
"r_y2": 418.19,
"r_x3": 149.16,
"r_y3": 418.19,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.88,
"r_x1": 213.48,
"r_y1": 436.88,
"r_x2": 213.48,
"r_y2": 429.15,
"r_x3": 70.03,
"r_y3": 429.15,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.48,
"r_y0": 437.09,
"r_x1": 261.04,
"r_y1": 437.09,
"r_x2": 261.04,
"r_y2": 429.07,
"r_x3": 213.48,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 440.34,
"r": 286.36,
"b": 481.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.927,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.36,
"r_x1": 65.4,
"r_y1": 448.36,
"r_x2": 65.4,
"r_y2": 440.34,
"r_x3": 50.11,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 448.36,
"r_x1": 286.36,
"r_y1": 448.36,
"r_x2": 286.36,
"r_y2": 440.34,
"r_x3": 67.69,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 459.32,
"r_x1": 202.74,
"r_y1": 459.32,
"r_x2": 202.74,
"r_y2": 451.3,
"r_x3": 70.03,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.32,
"r_x1": 286.36,
"r_y1": 459.32,
"r_x2": 286.36,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 470.28,
"r_x1": 286.36,
"r_y1": 470.28,
"r_x2": 286.36,
"r_y2": 462.26,
"r_x3": 70.03,
"r_y3": 462.26,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 481.24,
"r_x1": 141.87,
"r_y1": 481.24,
"r_x2": 141.87,
"r_y2": 473.22,
"r_x3": 70.03,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.03,
"r_x1": 166.02,
"r_y1": 481.03,
"r_x2": 166.02,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.01,
"r_y0": 481.24,
"r_x1": 259.9,
"r_y1": 481.24,
"r_x2": 259.9,
"r_y2": 473.22,
"r_x3": 166.01,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 484.49,
"r": 286.36,
"b": 536.34,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.51,
"r_x1": 66.03,
"r_y1": 492.51,
"r_x2": 66.03,
"r_y2": 484.49,
"r_x3": 50.11,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.42,
"r_y0": 492.51,
"r_x1": 286.36,
"r_y1": 492.51,
"r_x2": 286.36,
"r_y2": 484.49,
"r_x3": 68.42,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 503.47,
"r_x1": 286.36,
"r_y1": 503.47,
"r_x2": 286.36,
"r_y2": 495.45,
"r_x3": 70.03,
"r_y3": 495.45,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 514.22,
"r_x1": 227.41,
"r_y1": 514.22,
"r_x2": 227.41,
"r_y2": 506.49,
"r_x3": 70.03,
"r_y3": 506.49,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.41,
"r_y0": 514.42,
"r_x1": 286.36,
"r_y1": 514.42,
"r_x2": 286.36,
"r_y2": 506.41,
"r_x3": 227.41,
"r_y3": 506.41,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.38,
"r_x1": 286.36,
"r_y1": 525.38,
"r_x2": 286.36,
"r_y2": 517.37,
"r_x3": 70.03,
"r_y3": 517.37,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 536.34,
"r_x1": 112.36,
"r_y1": 536.34,
"r_x2": 112.36,
"r_y2": 528.33,
"r_x3": 70.03,
"r_y3": 528.33,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 539.6,
"r": 286.36,
"b": 591.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 547.61,
"r_x1": 65.47,
"r_y1": 547.61,
"r_x2": 65.47,
"r_y2": 539.6,
"r_x3": 50.11,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 547.61,
"r_x1": 286.36,
"r_y1": 547.61,
"r_x2": 286.36,
"r_y2": 539.6,
"r_x3": 67.77,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 558.57,
"r_x1": 136.28,
"r_y1": 558.57,
"r_x2": 136.28,
"r_y2": 550.56,
"r_x3": 70.03,
"r_y3": 550.56,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.81,
"r_y0": 558.37,
"r_x1": 286.36,
"r_y1": 558.37,
"r_x2": 286.36,
"r_y2": 550.64,
"r_x3": 138.81,
"r_y3": 550.64,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.33,
"r_x1": 286.36,
"r_y1": 569.33,
"r_x2": 286.36,
"r_y2": 561.6,
"r_x3": 70.03,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.29,
"r_x1": 74.51,
"r_y1": 580.29,
"r_x2": 74.51,
"r_y2": 572.56,
"r_x3": 70.03,
"r_y3": 572.56,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.51,
"r_y0": 580.49,
"r_x1": 286.36,
"r_y1": 580.49,
"r_x2": 286.36,
"r_y2": 572.48,
"r_x3": 74.51,
"r_y3": 572.48,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.45,
"r_x1": 90.36,
"r_y1": 591.45,
"r_x2": 90.36,
"r_y2": 583.43,
"r_x3": 70.03,
"r_y3": 583.43,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.71,
"r": 286.36,
"b": 646.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.72,
"r_x1": 66.27,
"r_y1": 602.72,
"r_x2": 66.27,
"r_y2": 594.71,
"r_x3": 50.11,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.72,
"r_x1": 286.36,
"r_y1": 602.72,
"r_x2": 286.36,
"r_y2": 594.71,
"r_x3": 68.7,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.68,
"r_x1": 286.36,
"r_y1": 613.68,
"r_x2": 286.36,
"r_y2": 605.66,
"r_x3": 70.03,
"r_y3": 605.66,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.64,
"r_x1": 286.36,
"r_y1": 624.64,
"r_x2": 286.36,
"r_y2": 616.62,
"r_x3": 70.03,
"r_y3": 616.62,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.58,
"r_x3": 70.03,
"r_y3": 627.58,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.92,
"r_y0": 635.39,
"r_x1": 286.36,
"r_y1": 635.39,
"r_x2": 286.36,
"r_y2": 627.66,
"r_x3": 79.92,
"r_y3": 627.66,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 646.35,
"r_x1": 140.68,
"r_y1": 646.35,
"r_x2": 140.68,
"r_y2": 638.62,
"r_x3": 70.03,
"r_y3": 638.62,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.68,
"r_y0": 646.56,
"r_x1": 264.44,
"r_y1": 646.56,
"r_x2": 264.44,
"r_y2": 638.54,
"r_x3": 140.68,
"r_y3": 638.54,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 649.81,
"r": 286.36,
"b": 679.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 657.83,
"r_x1": 66.53,
"r_y1": 657.83,
"r_x2": 66.53,
"r_y2": 649.81,
"r_x3": 50.11,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.83,
"r_x1": 286.36,
"r_y1": 657.83,
"r_x2": 286.36,
"r_y2": 649.81,
"r_x3": 69.0,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.79,
"r_x1": 93.2,
"r_y1": 668.79,
"r_x2": 93.2,
"r_y2": 660.77,
"r_x3": 70.03,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.79,
"r_x1": 286.36,
"r_y1": 668.79,
"r_x2": 286.36,
"r_y2": 660.77,
"r_x3": 102.2,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.75,
"r_x1": 172.0,
"r_y1": 679.75,
"r_x2": 172.0,
"r_y2": 671.73,
"r_x3": 70.03,
"r_y3": 671.73,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 683.0,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 691.02,
"r_x1": 65.52,
"r_y1": 691.02,
"r_x2": 65.52,
"r_y2": 683.0,
"r_x3": 50.11,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.83,
"r_y0": 691.02,
"r_x1": 286.36,
"r_y1": 691.02,
"r_x2": 286.36,
"r_y2": 683.0,
"r_x3": 67.83,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 701.98,
"r_x1": 102.16,
"r_y1": 701.98,
"r_x2": 102.16,
"r_y2": 693.96,
"r_x3": 70.03,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.55,
"r_y0": 701.77,
"r_x1": 231.47,
"r_y1": 701.77,
"r_x2": 231.47,
"r_y2": 694.04,
"r_x3": 107.55,
"r_y3": 694.04,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.48,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 231.48,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 97.92,
"r_y1": 712.94,
"r_x2": 97.92,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 75.88,
"r": 545.11,
"b": 138.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 83.9,
"r_x1": 324.75,
"r_y1": 83.9,
"r_x2": 324.75,
"r_y2": 75.88,
"r_x3": 308.86,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.13,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 327.13,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 545.11,
"r_y1": 94.86,
"r_x2": 545.11,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.82,
"r_x1": 390.96,
"r_y1": 105.82,
"r_x2": 390.96,
"r_y2": 97.8,
"r_x3": 328.78,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.27,
"r_y0": 105.82,
"r_x1": 435.14,
"r_y1": 105.82,
"r_x2": 435.14,
"r_y2": 97.8,
"r_x3": 400.27,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.71,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 441.71,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 440.81,
"r_y1": 116.78,
"r_x2": 440.81,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.63,
"r_y0": 116.57,
"r_x1": 545.11,
"r_y1": 116.57,
"r_x2": 545.11,
"r_y2": 108.84,
"r_x3": 446.63,
"r_y3": 108.84,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 127.53,
"r_x1": 471.13,
"r_y1": 127.53,
"r_x2": 471.13,
"r_y2": 119.8,
"r_x3": 328.78,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.13,
"r_y0": 127.73,
"r_x1": 545.11,
"r_y1": 127.73,
"r_x2": 545.11,
"r_y2": 119.72,
"r_x3": 471.13,
"r_y3": 119.72,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 138.69,
"r_x1": 356.67,
"r_y1": 138.69,
"r_x2": 356.67,
"r_y2": 130.68,
"r_x3": 328.78,
"r_y3": 130.68,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 142.12,
"r": 545.11,
"b": 172.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.925,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 150.14,
"r_x1": 325.24,
"r_y1": 150.14,
"r_x2": 325.24,
"r_y2": 142.12,
"r_x3": 308.86,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.14,
"r_x1": 545.11,
"r_y1": 150.14,
"r_x2": 545.11,
"r_y2": 142.12,
"r_x3": 327.7,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.1,
"r_x1": 414.45,
"r_y1": 161.1,
"r_x2": 414.45,
"r_y2": 153.08,
"r_x3": 328.78,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.83,
"r_y0": 161.1,
"r_x1": 545.11,
"r_y1": 161.1,
"r_x2": 545.11,
"r_y2": 153.08,
"r_x3": 421.83,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 172.06,
"r_x1": 493.63,
"r_y1": 172.06,
"r_x2": 493.63,
"r_y2": 164.04,
"r_x3": 328.78,
"r_y3": 164.04,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 175.49,
"r": 545.11,
"b": 260.21,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.5,
"r_x1": 324.27,
"r_y1": 183.5,
"r_x2": 324.27,
"r_y2": 175.49,
"r_x3": 308.86,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 183.5,
"r_x1": 545.11,
"r_y1": 183.5,
"r_x2": 545.11,
"r_y2": 175.49,
"r_x3": 326.58,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 194.46,
"r_x1": 545.11,
"r_y1": 194.46,
"r_x2": 545.11,
"r_y2": 186.45,
"r_x3": 328.78,
"r_y3": 186.45,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 205.42,
"r_x1": 545.11,
"r_y1": 205.42,
"r_x2": 545.11,
"r_y2": 197.4,
"r_x3": 328.78,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 216.38,
"r_x1": 545.11,
"r_y1": 216.38,
"r_x2": 545.11,
"r_y2": 208.36,
"r_x3": 328.78,
"r_y3": 208.36,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 227.34,
"r_x1": 479.26,
"r_y1": 227.34,
"r_x2": 479.26,
"r_y2": 219.32,
"r_x3": 328.78,
"r_y3": 219.32,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 227.13,
"r_x1": 545.11,
"r_y1": 227.13,
"r_x2": 545.11,
"r_y2": 219.4,
"r_x3": 483.12,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 238.09,
"r_x1": 519.4,
"r_y1": 238.09,
"r_x2": 519.4,
"r_y2": 230.36,
"r_x3": 328.78,
"r_y3": 230.36,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.11,
"r_y1": 238.3,
"r_x2": 545.11,
"r_y2": 230.28,
"r_x3": 519.4,
"r_y3": 230.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 249.26,
"r_x1": 545.11,
"r_y1": 249.26,
"r_x2": 545.11,
"r_y2": 241.24,
"r_x3": 328.78,
"r_y3": 241.24,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 260.21,
"r_x1": 333.26,
"r_y1": 260.21,
"r_x2": 333.26,
"r_y2": 252.2,
"r_x3": 328.78,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 263.64,
"r": 545.11,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 271.66,
"r_x1": 324.26,
"r_y1": 271.66,
"r_x2": 324.26,
"r_y2": 263.64,
"r_x3": 308.86,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 271.66,
"r_x1": 545.11,
"r_y1": 271.66,
"r_x2": 545.11,
"r_y2": 263.64,
"r_x3": 326.58,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 282.62,
"r_x1": 545.11,
"r_y1": 282.62,
"r_x2": 545.11,
"r_y2": 274.6,
"r_x3": 328.78,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 293.58,
"r_x1": 545.11,
"r_y1": 293.58,
"r_x2": 545.11,
"r_y2": 285.56,
"r_x3": 328.78,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 304.54,
"r_x1": 545.11,
"r_y1": 304.54,
"r_x2": 545.11,
"r_y2": 296.52,
"r_x3": 328.78,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 315.5,
"r_x1": 352.85,
"r_y1": 315.5,
"r_x2": 352.85,
"r_y2": 307.48,
"r_x3": 328.78,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.24,
"r_y0": 315.29,
"r_x1": 545.11,
"r_y1": 315.29,
"r_x2": 545.11,
"r_y2": 307.56,
"r_x3": 360.24,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 326.25,
"r_x1": 371.02,
"r_y1": 326.25,
"r_x2": 371.02,
"r_y2": 318.52,
"r_x3": 328.78,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.02,
"r_y0": 326.45,
"r_x1": 502.26,
"r_y1": 326.45,
"r_x2": 502.26,
"r_y2": 318.44,
"r_x3": 371.02,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 329.88,
"r": 545.12,
"b": 370.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.9,
"r_x1": 323.83,
"r_y1": 337.9,
"r_x2": 323.83,
"r_y2": 329.88,
"r_x3": 308.86,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.07,
"r_y0": 337.9,
"r_x1": 545.11,
"r_y1": 337.9,
"r_x2": 545.11,
"r_y2": 329.88,
"r_x3": 326.07,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 348.86,
"r_x1": 545.11,
"r_y1": 348.86,
"r_x2": 545.11,
"r_y2": 340.84,
"r_x3": 328.78,
"r_y3": 340.84,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 359.82,
"r_x1": 382.78,
"r_y1": 359.82,
"r_x2": 382.78,
"r_y2": 351.8,
"r_x3": 328.78,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.54,
"r_y0": 359.61,
"r_x1": 545.12,
"r_y1": 359.61,
"r_x2": 545.12,
"r_y2": 351.88,
"r_x3": 385.54,
"r_y3": 351.88,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 370.57,
"r_x1": 443.6,
"r_y1": 370.57,
"r_x2": 443.6,
"r_y2": 362.84,
"r_x3": 328.78,
"r_y3": 362.84,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.59,
"r_y0": 370.78,
"r_x1": 534.49,
"r_y1": 370.78,
"r_x2": 534.49,
"r_y2": 362.76,
"r_x3": 443.59,
"r_y3": 362.76,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 374.21,
"r": 545.11,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 382.22,
"r_x1": 324.6,
"r_y1": 382.22,
"r_x2": 324.6,
"r_y2": 374.21,
"r_x3": 308.86,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.96,
"r_y0": 382.22,
"r_x1": 362.66,
"r_y1": 382.22,
"r_x2": 362.66,
"r_y2": 374.21,
"r_x3": 326.96,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.69,
"r_y0": 382.22,
"r_x1": 389.61,
"r_y1": 382.22,
"r_x2": 389.61,
"r_y2": 374.21,
"r_x3": 368.69,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.65,
"r_y0": 382.22,
"r_x1": 424.56,
"r_y1": 382.22,
"r_x2": 424.56,
"r_y2": 374.21,
"r_x3": 395.65,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.55,
"r_y0": 382.22,
"r_x1": 438.02,
"r_y1": 382.22,
"r_x2": 438.02,
"r_y2": 374.21,
"r_x3": 431.55,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.06,
"r_y0": 382.22,
"r_x1": 488.5,
"r_y1": 382.22,
"r_x2": 488.5,
"r_y2": 374.21,
"r_x3": 444.06,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.48,
"r_y0": 382.22,
"r_x1": 515.41,
"r_y1": 382.22,
"r_x2": 515.41,
"r_y2": 374.21,
"r_x3": 495.48,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.45,
"r_y0": 382.22,
"r_x1": 545.11,
"r_y1": 382.22,
"r_x2": 545.11,
"r_y2": 374.21,
"r_x3": 521.45,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 393.18,
"r_x1": 545.11,
"r_y1": 393.18,
"r_x2": 545.11,
"r_y2": 385.17,
"r_x3": 328.78,
"r_y3": 385.17,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 404.14,
"r_x1": 545.11,
"r_y1": 404.14,
"r_x2": 545.11,
"r_y2": 396.12,
"r_x3": 328.78,
"r_y3": 396.12,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 415.1,
"r_x1": 478.01,
"r_y1": 415.1,
"r_x2": 478.01,
"r_y2": 407.08,
"r_x3": 328.78,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.07,
"r_y0": 415.1,
"r_x1": 491.54,
"r_y1": 415.1,
"r_x2": 491.54,
"r_y2": 407.08,
"r_x3": 484.07,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.67,
"r_y0": 414.89,
"r_x1": 545.11,
"r_y1": 414.89,
"r_x2": 545.11,
"r_y2": 407.16,
"r_x3": 494.67,
"r_y3": 407.16,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 425.85,
"r_x1": 545.11,
"r_y1": 425.85,
"r_x2": 545.11,
"r_y2": 418.12,
"r_x3": 328.78,
"r_y3": 418.12,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 436.81,
"r_x1": 360.84,
"r_y1": 436.81,
"r_x2": 360.84,
"r_y2": 429.08,
"r_x3": 328.78,
"r_y3": 429.08,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.84,
"r_y0": 437.02,
"r_x1": 475.63,
"r_y1": 437.02,
"r_x2": 475.63,
"r_y2": 429.0,
"r_x3": 360.84,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 440.45,
"r": 545.11,
"b": 558.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.46,
"r_x1": 324.57,
"r_y1": 448.46,
"r_x2": 324.57,
"r_y2": 440.45,
"r_x3": 308.86,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.93,
"r_y0": 448.46,
"r_x1": 545.11,
"r_y1": 448.46,
"r_x2": 545.11,
"r_y2": 440.45,
"r_x3": 326.93,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 459.42,
"r_x1": 545.11,
"r_y1": 459.42,
"r_x2": 545.11,
"r_y2": 451.41,
"r_x3": 328.78,
"r_y3": 451.41,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 470.38,
"r_x1": 545.11,
"r_y1": 470.38,
"r_x2": 545.11,
"r_y2": 462.36,
"r_x3": 328.78,
"r_y3": 462.36,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 481.34,
"r_x1": 545.11,
"r_y1": 481.34,
"r_x2": 545.11,
"r_y2": 473.32,
"r_x3": 328.78,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 492.3,
"r_x1": 545.11,
"r_y1": 492.3,
"r_x2": 545.11,
"r_y2": 484.28,
"r_x3": 328.78,
"r_y3": 484.28,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 503.26,
"r_x1": 545.11,
"r_y1": 503.26,
"r_x2": 545.11,
"r_y2": 495.24,
"r_x3": 328.78,
"r_y3": 495.24,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 514.22,
"r_x1": 545.11,
"r_y1": 514.22,
"r_x2": 545.11,
"r_y2": 506.2,
"r_x3": 328.78,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 525.17,
"r_x1": 545.11,
"r_y1": 525.17,
"r_x2": 545.11,
"r_y2": 517.16,
"r_x3": 328.78,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 536.13,
"r_x1": 434.57,
"r_y1": 536.13,
"r_x2": 434.57,
"r_y2": 528.12,
"r_x3": 328.78,
"r_y3": 528.12,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.86,
"r_y0": 535.93,
"r_x1": 545.11,
"r_y1": 535.93,
"r_x2": 545.11,
"r_y2": 528.2,
"r_x3": 437.86,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 546.89,
"r_x1": 425.73,
"r_y1": 546.89,
"r_x2": 425.73,
"r_y2": 539.16,
"r_x3": 328.78,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.74,
"r_y0": 547.09,
"r_x1": 545.11,
"r_y1": 547.09,
"r_x2": 545.11,
"r_y2": 539.08,
"r_x3": 425.74,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 558.05,
"r_x1": 399.74,
"r_y1": 558.05,
"r_x2": 399.74,
"r_y2": 550.03,
"r_x3": 328.78,
"r_y3": 550.03,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 561.48,
"r": 545.11,
"b": 624.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.48,
"r_x3": 308.86,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.85,
"r_y0": 569.5,
"r_x1": 545.11,
"r_y1": 569.5,
"r_x2": 545.11,
"r_y2": 561.48,
"r_x3": 326.85,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 580.46,
"r_x1": 545.11,
"r_y1": 580.46,
"r_x2": 545.11,
"r_y2": 572.44,
"r_x3": 328.78,
"r_y3": 572.44,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 591.41,
"r_x1": 545.11,
"r_y1": 591.41,
"r_x2": 545.11,
"r_y2": 583.4,
"r_x3": 328.78,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 602.37,
"r_x1": 431.62,
"r_y1": 602.37,
"r_x2": 431.62,
"r_y2": 594.36,
"r_x3": 328.78,
"r_y3": 594.36,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.69,
"r_y0": 602.17,
"r_x1": 545.11,
"r_y1": 602.17,
"r_x2": 545.11,
"r_y2": 594.44,
"r_x3": 434.69,
"r_y3": 594.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 613.13,
"r_x1": 545.11,
"r_y1": 613.13,
"r_x2": 545.11,
"r_y2": 605.4,
"r_x3": 328.78,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 624.08,
"r_x1": 367.8,
"r_y1": 624.08,
"r_x2": 367.8,
"r_y2": 616.36,
"r_x3": 328.78,
"r_y3": 616.36,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.29,
"r_x1": 458.69,
"r_y1": 624.29,
"r_x2": 458.69,
"r_y2": 616.28,
"r_x3": 367.8,
"r_y3": 616.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 627.72,
"r": 545.12,
"b": 668.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 635.74,
"r_x1": 324.69,
"r_y1": 635.74,
"r_x2": 324.69,
"r_y2": 627.72,
"r_x3": 308.86,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.07,
"r_y0": 635.74,
"r_x1": 545.11,
"r_y1": 635.74,
"r_x2": 545.11,
"r_y2": 627.72,
"r_x3": 327.07,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 646.7,
"r_x1": 545.11,
"r_y1": 646.7,
"r_x2": 545.11,
"r_y2": 638.68,
"r_x3": 328.78,
"r_y3": 638.68,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 657.65,
"r_x1": 336.25,
"r_y1": 657.65,
"r_x2": 336.25,
"r_y2": 649.64,
"r_x3": 328.78,
"r_y3": 649.64,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.45,
"r_x1": 545.12,
"r_y1": 657.45,
"r_x2": 545.12,
"r_y2": 649.72,
"r_x3": 338.1,
"r_y3": 649.72,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 668.41,
"r_x1": 406.32,
"r_y1": 668.41,
"r_x2": 406.32,
"r_y2": 660.68,
"r_x3": 328.78,
"r_y3": 660.68,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 668.61,
"r_x1": 521.12,
"r_y1": 668.61,
"r_x2": 521.12,
"r_y2": 660.6,
"r_x3": 406.32,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 672.04,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.865,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 680.06,
"r_x1": 324.71,
"r_y1": 680.06,
"r_x2": 324.71,
"r_y2": 672.04,
"r_x3": 308.86,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.09,
"r_y0": 680.06,
"r_x1": 545.11,
"r_y1": 680.06,
"r_x2": 545.11,
"r_y2": 672.04,
"r_x3": 327.09,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 691.02,
"r_x1": 482.81,
"r_y1": 691.02,
"r_x2": 482.81,
"r_y2": 683.0,
"r_x3": 328.78,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.75,
"r_y0": 691.02,
"r_x1": 545.11,
"r_y1": 691.02,
"r_x2": 545.11,
"r_y2": 683.0,
"r_x3": 488.75,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 328.78,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 379.15,
"r_y1": 712.94,
"r_x2": 379.15,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.62,
"r_y0": 712.73,
"r_x1": 545.11,
"r_y1": 712.73,
"r_x2": 545.11,
"r_y2": 705.0,
"r_x3": 381.62,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "list_item",
"id": 25,
"page_no": 8,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.731,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 70.03,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 286.36,
"r_y1": 94.86,
"r_x2": 286.36,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 105.82,
"r_x1": 85.72,
"r_y1": 105.82,
"r_x2": 85.72,
"r_y2": 97.8,
"r_x3": 70.03,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.89,
"r_y0": 105.61,
"r_x1": 199.93,
"r_y1": 105.61,
"r_x2": 199.93,
"r_y2": 97.88,
"r_x3": 87.89,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.94,
"r_y0": 105.82,
"r_x1": 286.36,
"r_y1": 105.82,
"r_x2": 286.36,
"r_y2": 97.8,
"r_x3": 199.94,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 116.78,
"r_x1": 221.95,
"r_y1": 116.78,
"r_x2": 221.95,
"r_y2": 108.76,
"r_x3": 70.03,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"
},
{
"label": "list_item",
"id": 9,
"page_no": 8,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.03,
"r": 286.36,
"b": 149.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.05,
"r_x1": 65.21,
"r_y1": 128.05,
"r_x2": 65.21,
"r_y2": 120.03,
"r_x3": 54.6,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.48,
"r_y0": 128.05,
"r_x1": 286.36,
"r_y1": 128.05,
"r_x2": 286.36,
"r_y2": 120.03,
"r_x3": 67.48,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.01,
"r_x1": 179.67,
"r_y1": 139.01,
"r_x2": 179.67,
"r_y2": 130.99,
"r_x3": 70.03,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 139.01,
"r_x1": 286.36,
"r_y1": 139.01,
"r_x2": 286.36,
"r_y2": 130.99,
"r_x3": 185.58,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.97,
"r_x1": 113.11,
"r_y1": 149.97,
"r_x2": 113.11,
"r_y2": 141.95,
"r_x3": 70.03,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.34,
"r_y0": 149.76,
"r_x1": 235.31,
"r_y1": 149.76,
"r_x2": 235.31,
"r_y2": 142.03,
"r_x3": 116.34,
"r_y3": 142.03,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.31,
"r_y0": 149.97,
"r_x1": 267.68,
"r_y1": 149.97,
"r_x2": 267.68,
"r_y2": 141.95,
"r_x3": 235.31,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"
},
{
"label": "list_item",
"id": 7,
"page_no": 8,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.22,
"r": 286.36,
"b": 183.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.24,
"r_x1": 65.1,
"r_y1": 161.24,
"r_x2": 65.1,
"r_y2": 153.22,
"r_x3": 54.6,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.36,
"r_y0": 161.24,
"r_x1": 218.78,
"r_y1": 161.24,
"r_x2": 218.78,
"r_y2": 153.22,
"r_x3": 67.36,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.98,
"r_y0": 161.03,
"r_x1": 286.36,
"r_y1": 161.03,
"r_x2": 286.36,
"r_y2": 153.3,
"r_x3": 220.98,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 171.99,
"r_x1": 125.26,
"r_y1": 171.99,
"r_x2": 125.26,
"r_y2": 164.26,
"r_x3": 70.03,
"r_y3": 164.26,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.26,
"r_y0": 172.2,
"r_x1": 286.36,
"r_y1": 172.2,
"r_x2": 286.36,
"r_y2": 164.18,
"r_x3": 125.26,
"r_y3": 164.18,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.15,
"r_x1": 97.92,
"r_y1": 183.15,
"r_x2": 97.92,
"r_y2": 175.14,
"r_x3": 70.03,
"r_y3": 175.14,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"
},
{
"label": "list_item",
"id": 0,
"page_no": 8,
"cluster": {
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 186.41,
"r": 286.36,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 194.43,
"r_x1": 65.81,
"r_y1": 194.43,
"r_x2": 65.81,
"r_y2": 186.41,
"r_x3": 54.59,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.21,
"r_y0": 194.43,
"r_x1": 286.36,
"r_y1": 194.43,
"r_x2": 286.36,
"r_y2": 186.41,
"r_x3": 68.21,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.39,
"r_x1": 286.36,
"r_y1": 205.39,
"r_x2": 286.36,
"r_y2": 197.37,
"r_x3": 70.03,
"r_y3": 197.37,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 216.34,
"r_x1": 286.36,
"r_y1": 216.34,
"r_x2": 286.36,
"r_y2": 208.33,
"r_x3": 70.03,
"r_y3": 208.33,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.3,
"r_x1": 245.84,
"r_y1": 227.3,
"r_x2": 245.84,
"r_y2": 219.29,
"r_x3": 70.03,
"r_y3": 219.29,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"
},
{
"label": "list_item",
"id": 1,
"page_no": 8,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 230.56,
"r": 286.36,
"b": 271.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 238.58,
"r_x1": 65.38,
"r_y1": 238.58,
"r_x2": 65.38,
"r_y2": 230.56,
"r_x3": 54.59,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 238.58,
"r_x1": 286.36,
"r_y1": 238.58,
"r_x2": 286.36,
"r_y2": 230.56,
"r_x3": 67.69,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.53,
"r_x1": 286.36,
"r_y1": 249.53,
"r_x2": 286.36,
"r_y2": 241.52,
"r_x3": 70.03,
"r_y3": 241.52,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.49,
"r_x1": 108.4,
"r_y1": 260.49,
"r_x2": 108.4,
"r_y2": 252.48,
"r_x3": 70.03,
"r_y3": 252.48,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.64,
"r_y0": 260.29,
"r_x1": 286.36,
"r_y1": 260.29,
"r_x2": 286.36,
"r_y2": 252.56,
"r_x3": 110.64,
"r_y3": 252.56,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.25,
"r_x1": 140.58,
"r_y1": 271.25,
"r_x2": 140.58,
"r_y2": 263.52,
"r_x3": 70.03,
"r_y3": 263.52,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.58,
"r_y0": 271.45,
"r_x1": 266.48,
"r_y1": 271.45,
"r_x2": 266.48,
"r_y2": 263.44,
"r_x3": 140.58,
"r_y3": 263.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"
},
{
"label": "list_item",
"id": 2,
"page_no": 8,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 274.71,
"r": 286.37,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 282.72,
"r_x1": 64.85,
"r_y1": 282.72,
"r_x2": 64.85,
"r_y2": 274.71,
"r_x3": 54.59,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.05,
"r_y0": 282.72,
"r_x1": 286.37,
"r_y1": 282.72,
"r_x2": 286.37,
"r_y2": 274.71,
"r_x3": 67.05,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.68,
"r_x1": 179.57,
"r_y1": 293.68,
"r_x2": 179.57,
"r_y2": 285.67,
"r_x3": 70.03,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.02,
"r_y0": 293.68,
"r_x1": 194.48,
"r_y1": 293.68,
"r_x2": 194.48,
"r_y2": 285.67,
"r_x3": 187.02,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.04,
"r_y0": 293.48,
"r_x1": 286.36,
"r_y1": 293.48,
"r_x2": 286.36,
"r_y2": 285.75,
"r_x3": 198.04,
"r_y3": 285.75,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.44,
"r_x1": 260.2,
"r_y1": 304.44,
"r_x2": 260.2,
"r_y2": 296.71,
"r_x3": 70.03,
"r_y3": 296.71,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.64,
"r_x1": 286.36,
"r_y1": 304.64,
"r_x2": 286.36,
"r_y2": 296.63,
"r_x3": 260.2,
"r_y3": 296.63,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.6,
"r_x1": 142.75,
"r_y1": 315.6,
"r_x2": 142.75,
"r_y2": 307.58,
"r_x3": 70.03,
"r_y3": 307.58,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"
},
{
"label": "list_item",
"id": 4,
"page_no": 8,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 318.86,
"r": 286.36,
"b": 348.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 326.87,
"r_x1": 65.62,
"r_y1": 326.87,
"r_x2": 65.62,
"r_y2": 318.86,
"r_x3": 54.59,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 326.87,
"r_x1": 199.49,
"r_y1": 326.87,
"r_x2": 199.49,
"r_y2": 318.86,
"r_x3": 67.98,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.99,
"r_y0": 326.87,
"r_x1": 286.36,
"r_y1": 326.87,
"r_x2": 286.36,
"r_y2": 318.86,
"r_x3": 206.99,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 337.83,
"r_x1": 176.28,
"r_y1": 337.83,
"r_x2": 176.28,
"r_y2": 329.81,
"r_x3": 70.03,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.83,
"r_x1": 190.07,
"r_y1": 337.83,
"r_x2": 190.07,
"r_y2": 329.81,
"r_x3": 182.6,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.28,
"r_y0": 337.62,
"r_x1": 286.36,
"r_y1": 337.62,
"r_x2": 286.36,
"r_y2": 329.9,
"r_x3": 193.28,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.58,
"r_x1": 206.35,
"r_y1": 348.58,
"r_x2": 206.35,
"r_y2": 340.85,
"r_x3": 70.03,
"r_y3": 340.85,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.35,
"r_y0": 348.79,
"r_x1": 274.82,
"r_y1": 348.79,
"r_x2": 274.82,
"r_y2": 340.77,
"r_x3": 206.35,
"r_y3": 340.77,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"
},
{
"label": "list_item",
"id": 3,
"page_no": 8,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 352.05,
"r": 286.36,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 360.06,
"r_x1": 65.05,
"r_y1": 360.06,
"r_x2": 65.05,
"r_y2": 352.05,
"r_x3": 54.59,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.29,
"r_y0": 360.06,
"r_x1": 286.36,
"r_y1": 360.06,
"r_x2": 286.36,
"r_y2": 352.05,
"r_x3": 67.29,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 371.02,
"r_x1": 234.13,
"r_y1": 371.02,
"r_x2": 234.13,
"r_y2": 363.0,
"r_x3": 70.03,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.05,
"r_y0": 371.02,
"r_x1": 286.36,
"r_y1": 371.02,
"r_x2": 286.36,
"r_y2": 363.0,
"r_x3": 240.05,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.98,
"r_x1": 286.36,
"r_y1": 381.98,
"r_x2": 286.36,
"r_y2": 373.96,
"r_x3": 70.03,
"r_y3": 373.96,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 70.03,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 114.58,
"r_y1": 403.9,
"r_x2": 114.58,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.69,
"r_x1": 186.73,
"r_y1": 403.69,
"r_x2": 186.73,
"r_y2": 395.96,
"r_x3": 117.8,
"r_y3": 395.96,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.73,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.88,
"r_x3": 186.73,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"
},
{
"label": "list_item",
"id": 10,
"page_no": 8,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.15,
"r": 286.36,
"b": 437.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.933,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.17,
"r_x1": 65.33,
"r_y1": 415.17,
"r_x2": 65.33,
"r_y2": 407.15,
"r_x3": 54.6,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.64,
"r_y0": 415.17,
"r_x1": 286.36,
"r_y1": 415.17,
"r_x2": 286.36,
"r_y2": 407.15,
"r_x3": 67.64,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 426.13,
"r_x1": 147.13,
"r_y1": 426.13,
"r_x2": 147.13,
"r_y2": 418.11,
"r_x3": 70.03,
"r_y3": 418.11,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.16,
"r_y0": 425.92,
"r_x1": 286.36,
"r_y1": 425.92,
"r_x2": 286.36,
"r_y2": 418.19,
"r_x3": 149.16,
"r_y3": 418.19,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.88,
"r_x1": 213.48,
"r_y1": 436.88,
"r_x2": 213.48,
"r_y2": 429.15,
"r_x3": 70.03,
"r_y3": 429.15,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.48,
"r_y0": 437.09,
"r_x1": 261.04,
"r_y1": 437.09,
"r_x2": 261.04,
"r_y2": 429.07,
"r_x3": 213.48,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"
},
{
"label": "list_item",
"id": 14,
"page_no": 8,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 440.34,
"r": 286.36,
"b": 481.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.927,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.36,
"r_x1": 65.4,
"r_y1": 448.36,
"r_x2": 65.4,
"r_y2": 440.34,
"r_x3": 50.11,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 448.36,
"r_x1": 286.36,
"r_y1": 448.36,
"r_x2": 286.36,
"r_y2": 440.34,
"r_x3": 67.69,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 459.32,
"r_x1": 202.74,
"r_y1": 459.32,
"r_x2": 202.74,
"r_y2": 451.3,
"r_x3": 70.03,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.32,
"r_x1": 286.36,
"r_y1": 459.32,
"r_x2": 286.36,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 470.28,
"r_x1": 286.36,
"r_y1": 470.28,
"r_x2": 286.36,
"r_y2": 462.26,
"r_x3": 70.03,
"r_y3": 462.26,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 481.24,
"r_x1": 141.87,
"r_y1": 481.24,
"r_x2": 141.87,
"r_y2": 473.22,
"r_x3": 70.03,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.03,
"r_x1": 166.02,
"r_y1": 481.03,
"r_x2": 166.02,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.01,
"r_y0": 481.24,
"r_x1": 259.9,
"r_y1": 481.24,
"r_x2": 259.9,
"r_y2": 473.22,
"r_x3": 166.01,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"
},
{
"label": "list_item",
"id": 11,
"page_no": 8,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 484.49,
"r": 286.36,
"b": 536.34,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.51,
"r_x1": 66.03,
"r_y1": 492.51,
"r_x2": 66.03,
"r_y2": 484.49,
"r_x3": 50.11,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.42,
"r_y0": 492.51,
"r_x1": 286.36,
"r_y1": 492.51,
"r_x2": 286.36,
"r_y2": 484.49,
"r_x3": 68.42,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 503.47,
"r_x1": 286.36,
"r_y1": 503.47,
"r_x2": 286.36,
"r_y2": 495.45,
"r_x3": 70.03,
"r_y3": 495.45,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 514.22,
"r_x1": 227.41,
"r_y1": 514.22,
"r_x2": 227.41,
"r_y2": 506.49,
"r_x3": 70.03,
"r_y3": 506.49,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.41,
"r_y0": 514.42,
"r_x1": 286.36,
"r_y1": 514.42,
"r_x2": 286.36,
"r_y2": 506.41,
"r_x3": 227.41,
"r_y3": 506.41,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.38,
"r_x1": 286.36,
"r_y1": 525.38,
"r_x2": 286.36,
"r_y2": 517.37,
"r_x3": 70.03,
"r_y3": 517.37,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 536.34,
"r_x1": 112.36,
"r_y1": 536.34,
"r_x2": 112.36,
"r_y2": 528.33,
"r_x3": 70.03,
"r_y3": 528.33,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 8,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 539.6,
"r": 286.36,
"b": 591.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 547.61,
"r_x1": 65.47,
"r_y1": 547.61,
"r_x2": 65.47,
"r_y2": 539.6,
"r_x3": 50.11,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 547.61,
"r_x1": 286.36,
"r_y1": 547.61,
"r_x2": 286.36,
"r_y2": 539.6,
"r_x3": 67.77,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 558.57,
"r_x1": 136.28,
"r_y1": 558.57,
"r_x2": 136.28,
"r_y2": 550.56,
"r_x3": 70.03,
"r_y3": 550.56,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.81,
"r_y0": 558.37,
"r_x1": 286.36,
"r_y1": 558.37,
"r_x2": 286.36,
"r_y2": 550.64,
"r_x3": 138.81,
"r_y3": 550.64,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.33,
"r_x1": 286.36,
"r_y1": 569.33,
"r_x2": 286.36,
"r_y2": 561.6,
"r_x3": 70.03,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.29,
"r_x1": 74.51,
"r_y1": 580.29,
"r_x2": 74.51,
"r_y2": 572.56,
"r_x3": 70.03,
"r_y3": 572.56,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.51,
"r_y0": 580.49,
"r_x1": 286.36,
"r_y1": 580.49,
"r_x2": 286.36,
"r_y2": 572.48,
"r_x3": 74.51,
"r_y3": 572.48,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.45,
"r_x1": 90.36,
"r_y1": 591.45,
"r_x2": 90.36,
"r_y2": 583.43,
"r_x3": 70.03,
"r_y3": 583.43,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"
},
{
"label": "list_item",
"id": 13,
"page_no": 8,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.71,
"r": 286.36,
"b": 646.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.72,
"r_x1": 66.27,
"r_y1": 602.72,
"r_x2": 66.27,
"r_y2": 594.71,
"r_x3": 50.11,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.72,
"r_x1": 286.36,
"r_y1": 602.72,
"r_x2": 286.36,
"r_y2": 594.71,
"r_x3": 68.7,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.68,
"r_x1": 286.36,
"r_y1": 613.68,
"r_x2": 286.36,
"r_y2": 605.66,
"r_x3": 70.03,
"r_y3": 605.66,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.64,
"r_x1": 286.36,
"r_y1": 624.64,
"r_x2": 286.36,
"r_y2": 616.62,
"r_x3": 70.03,
"r_y3": 616.62,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.58,
"r_x3": 70.03,
"r_y3": 627.58,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.92,
"r_y0": 635.39,
"r_x1": 286.36,
"r_y1": 635.39,
"r_x2": 286.36,
"r_y2": 627.66,
"r_x3": 79.92,
"r_y3": 627.66,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 646.35,
"r_x1": 140.68,
"r_y1": 646.35,
"r_x2": 140.68,
"r_y2": 638.62,
"r_x3": 70.03,
"r_y3": 638.62,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.68,
"r_y0": 646.56,
"r_x1": 264.44,
"r_y1": 646.56,
"r_x2": 264.44,
"r_y2": 638.54,
"r_x3": 140.68,
"r_y3": 638.54,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"
},
{
"label": "list_item",
"id": 17,
"page_no": 8,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 649.81,
"r": 286.36,
"b": 679.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 657.83,
"r_x1": 66.53,
"r_y1": 657.83,
"r_x2": 66.53,
"r_y2": 649.81,
"r_x3": 50.11,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.83,
"r_x1": 286.36,
"r_y1": 657.83,
"r_x2": 286.36,
"r_y2": 649.81,
"r_x3": 69.0,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.79,
"r_x1": 93.2,
"r_y1": 668.79,
"r_x2": 93.2,
"r_y2": 660.77,
"r_x3": 70.03,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.79,
"r_x1": 286.36,
"r_y1": 668.79,
"r_x2": 286.36,
"r_y2": 660.77,
"r_x3": 102.2,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.75,
"r_x1": 172.0,
"r_y1": 679.75,
"r_x2": 172.0,
"r_y2": 671.73,
"r_x3": 70.03,
"r_y3": 671.73,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"
},
{
"label": "list_item",
"id": 16,
"page_no": 8,
"cluster": {
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 683.0,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 691.02,
"r_x1": 65.52,
"r_y1": 691.02,
"r_x2": 65.52,
"r_y2": 683.0,
"r_x3": 50.11,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.83,
"r_y0": 691.02,
"r_x1": 286.36,
"r_y1": 691.02,
"r_x2": 286.36,
"r_y2": 683.0,
"r_x3": 67.83,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 701.98,
"r_x1": 102.16,
"r_y1": 701.98,
"r_x2": 102.16,
"r_y2": 693.96,
"r_x3": 70.03,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.55,
"r_y0": 701.77,
"r_x1": 231.47,
"r_y1": 701.77,
"r_x2": 231.47,
"r_y2": 694.04,
"r_x3": 107.55,
"r_y3": 694.04,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.48,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 231.48,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 97.92,
"r_y1": 712.94,
"r_x2": 97.92,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"
},
{
"label": "list_item",
"id": 6,
"page_no": 8,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 75.88,
"r": 545.11,
"b": 138.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 83.9,
"r_x1": 324.75,
"r_y1": 83.9,
"r_x2": 324.75,
"r_y2": 75.88,
"r_x3": 308.86,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.13,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 327.13,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 545.11,
"r_y1": 94.86,
"r_x2": 545.11,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.82,
"r_x1": 390.96,
"r_y1": 105.82,
"r_x2": 390.96,
"r_y2": 97.8,
"r_x3": 328.78,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.27,
"r_y0": 105.82,
"r_x1": 435.14,
"r_y1": 105.82,
"r_x2": 435.14,
"r_y2": 97.8,
"r_x3": 400.27,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.71,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 441.71,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 440.81,
"r_y1": 116.78,
"r_x2": 440.81,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.63,
"r_y0": 116.57,
"r_x1": 545.11,
"r_y1": 116.57,
"r_x2": 545.11,
"r_y2": 108.84,
"r_x3": 446.63,
"r_y3": 108.84,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 127.53,
"r_x1": 471.13,
"r_y1": 127.53,
"r_x2": 471.13,
"r_y2": 119.8,
"r_x3": 328.78,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.13,
"r_y0": 127.73,
"r_x1": 545.11,
"r_y1": 127.73,
"r_x2": 545.11,
"r_y2": 119.72,
"r_x3": 471.13,
"r_y3": 119.72,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 138.69,
"r_x1": 356.67,
"r_y1": 138.69,
"r_x2": 356.67,
"r_y2": 130.68,
"r_x3": 328.78,
"r_y3": 130.68,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"
},
{
"label": "list_item",
"id": 15,
"page_no": 8,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 142.12,
"r": 545.11,
"b": 172.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.925,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 150.14,
"r_x1": 325.24,
"r_y1": 150.14,
"r_x2": 325.24,
"r_y2": 142.12,
"r_x3": 308.86,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.14,
"r_x1": 545.11,
"r_y1": 150.14,
"r_x2": 545.11,
"r_y2": 142.12,
"r_x3": 327.7,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.1,
"r_x1": 414.45,
"r_y1": 161.1,
"r_x2": 414.45,
"r_y2": 153.08,
"r_x3": 328.78,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.83,
"r_y0": 161.1,
"r_x1": 545.11,
"r_y1": 161.1,
"r_x2": 545.11,
"r_y2": 153.08,
"r_x3": 421.83,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 172.06,
"r_x1": 493.63,
"r_y1": 172.06,
"r_x2": 493.63,
"r_y2": 164.04,
"r_x3": 328.78,
"r_y3": 164.04,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"
},
{
"label": "list_item",
"id": 12,
"page_no": 8,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 175.49,
"r": 545.11,
"b": 260.21,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.5,
"r_x1": 324.27,
"r_y1": 183.5,
"r_x2": 324.27,
"r_y2": 175.49,
"r_x3": 308.86,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 183.5,
"r_x1": 545.11,
"r_y1": 183.5,
"r_x2": 545.11,
"r_y2": 175.49,
"r_x3": 326.58,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 194.46,
"r_x1": 545.11,
"r_y1": 194.46,
"r_x2": 545.11,
"r_y2": 186.45,
"r_x3": 328.78,
"r_y3": 186.45,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 205.42,
"r_x1": 545.11,
"r_y1": 205.42,
"r_x2": 545.11,
"r_y2": 197.4,
"r_x3": 328.78,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 216.38,
"r_x1": 545.11,
"r_y1": 216.38,
"r_x2": 545.11,
"r_y2": 208.36,
"r_x3": 328.78,
"r_y3": 208.36,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 227.34,
"r_x1": 479.26,
"r_y1": 227.34,
"r_x2": 479.26,
"r_y2": 219.32,
"r_x3": 328.78,
"r_y3": 219.32,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 227.13,
"r_x1": 545.11,
"r_y1": 227.13,
"r_x2": 545.11,
"r_y2": 219.4,
"r_x3": 483.12,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 238.09,
"r_x1": 519.4,
"r_y1": 238.09,
"r_x2": 519.4,
"r_y2": 230.36,
"r_x3": 328.78,
"r_y3": 230.36,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.11,
"r_y1": 238.3,
"r_x2": 545.11,
"r_y2": 230.28,
"r_x3": 519.4,
"r_y3": 230.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 249.26,
"r_x1": 545.11,
"r_y1": 249.26,
"r_x2": 545.11,
"r_y2": 241.24,
"r_x3": 328.78,
"r_y3": 241.24,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 260.21,
"r_x1": 333.26,
"r_y1": 260.21,
"r_x2": 333.26,
"r_y2": 252.2,
"r_x3": 328.78,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 8,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 263.64,
"r": 545.11,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 271.66,
"r_x1": 324.26,
"r_y1": 271.66,
"r_x2": 324.26,
"r_y2": 263.64,
"r_x3": 308.86,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 271.66,
"r_x1": 545.11,
"r_y1": 271.66,
"r_x2": 545.11,
"r_y2": 263.64,
"r_x3": 326.58,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 282.62,
"r_x1": 545.11,
"r_y1": 282.62,
"r_x2": 545.11,
"r_y2": 274.6,
"r_x3": 328.78,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 293.58,
"r_x1": 545.11,
"r_y1": 293.58,
"r_x2": 545.11,
"r_y2": 285.56,
"r_x3": 328.78,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 304.54,
"r_x1": 545.11,
"r_y1": 304.54,
"r_x2": 545.11,
"r_y2": 296.52,
"r_x3": 328.78,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 315.5,
"r_x1": 352.85,
"r_y1": 315.5,
"r_x2": 352.85,
"r_y2": 307.48,
"r_x3": 328.78,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.24,
"r_y0": 315.29,
"r_x1": 545.11,
"r_y1": 315.29,
"r_x2": 545.11,
"r_y2": 307.56,
"r_x3": 360.24,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 326.25,
"r_x1": 371.02,
"r_y1": 326.25,
"r_x2": 371.02,
"r_y2": 318.52,
"r_x3": 328.78,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.02,
"r_y0": 326.45,
"r_x1": 502.26,
"r_y1": 326.45,
"r_x2": 502.26,
"r_y2": 318.44,
"r_x3": 371.02,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"
},
{
"label": "list_item",
"id": 18,
"page_no": 8,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 329.88,
"r": 545.12,
"b": 370.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.9,
"r_x1": 323.83,
"r_y1": 337.9,
"r_x2": 323.83,
"r_y2": 329.88,
"r_x3": 308.86,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.07,
"r_y0": 337.9,
"r_x1": 545.11,
"r_y1": 337.9,
"r_x2": 545.11,
"r_y2": 329.88,
"r_x3": 326.07,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 348.86,
"r_x1": 545.11,
"r_y1": 348.86,
"r_x2": 545.11,
"r_y2": 340.84,
"r_x3": 328.78,
"r_y3": 340.84,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 359.82,
"r_x1": 382.78,
"r_y1": 359.82,
"r_x2": 382.78,
"r_y2": 351.8,
"r_x3": 328.78,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.54,
"r_y0": 359.61,
"r_x1": 545.12,
"r_y1": 359.61,
"r_x2": 545.12,
"r_y2": 351.88,
"r_x3": 385.54,
"r_y3": 351.88,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 370.57,
"r_x1": 443.6,
"r_y1": 370.57,
"r_x2": 443.6,
"r_y2": 362.84,
"r_x3": 328.78,
"r_y3": 362.84,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.59,
"r_y0": 370.78,
"r_x1": 534.49,
"r_y1": 370.78,
"r_x2": 534.49,
"r_y2": 362.76,
"r_x3": 443.59,
"r_y3": 362.76,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"
},
{
"label": "list_item",
"id": 21,
"page_no": 8,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 374.21,
"r": 545.11,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 382.22,
"r_x1": 324.6,
"r_y1": 382.22,
"r_x2": 324.6,
"r_y2": 374.21,
"r_x3": 308.86,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.96,
"r_y0": 382.22,
"r_x1": 362.66,
"r_y1": 382.22,
"r_x2": 362.66,
"r_y2": 374.21,
"r_x3": 326.96,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.69,
"r_y0": 382.22,
"r_x1": 389.61,
"r_y1": 382.22,
"r_x2": 389.61,
"r_y2": 374.21,
"r_x3": 368.69,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.65,
"r_y0": 382.22,
"r_x1": 424.56,
"r_y1": 382.22,
"r_x2": 424.56,
"r_y2": 374.21,
"r_x3": 395.65,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.55,
"r_y0": 382.22,
"r_x1": 438.02,
"r_y1": 382.22,
"r_x2": 438.02,
"r_y2": 374.21,
"r_x3": 431.55,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.06,
"r_y0": 382.22,
"r_x1": 488.5,
"r_y1": 382.22,
"r_x2": 488.5,
"r_y2": 374.21,
"r_x3": 444.06,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.48,
"r_y0": 382.22,
"r_x1": 515.41,
"r_y1": 382.22,
"r_x2": 515.41,
"r_y2": 374.21,
"r_x3": 495.48,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.45,
"r_y0": 382.22,
"r_x1": 545.11,
"r_y1": 382.22,
"r_x2": 545.11,
"r_y2": 374.21,
"r_x3": 521.45,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 393.18,
"r_x1": 545.11,
"r_y1": 393.18,
"r_x2": 545.11,
"r_y2": 385.17,
"r_x3": 328.78,
"r_y3": 385.17,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 404.14,
"r_x1": 545.11,
"r_y1": 404.14,
"r_x2": 545.11,
"r_y2": 396.12,
"r_x3": 328.78,
"r_y3": 396.12,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 415.1,
"r_x1": 478.01,
"r_y1": 415.1,
"r_x2": 478.01,
"r_y2": 407.08,
"r_x3": 328.78,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.07,
"r_y0": 415.1,
"r_x1": 491.54,
"r_y1": 415.1,
"r_x2": 491.54,
"r_y2": 407.08,
"r_x3": 484.07,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.67,
"r_y0": 414.89,
"r_x1": 545.11,
"r_y1": 414.89,
"r_x2": 545.11,
"r_y2": 407.16,
"r_x3": 494.67,
"r_y3": 407.16,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 425.85,
"r_x1": 545.11,
"r_y1": 425.85,
"r_x2": 545.11,
"r_y2": 418.12,
"r_x3": 328.78,
"r_y3": 418.12,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 436.81,
"r_x1": 360.84,
"r_y1": 436.81,
"r_x2": 360.84,
"r_y2": 429.08,
"r_x3": 328.78,
"r_y3": 429.08,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.84,
"r_y0": 437.02,
"r_x1": 475.63,
"r_y1": 437.02,
"r_x2": 475.63,
"r_y2": 429.0,
"r_x3": 360.84,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"
},
{
"label": "list_item",
"id": 20,
"page_no": 8,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 440.45,
"r": 545.11,
"b": 558.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.46,
"r_x1": 324.57,
"r_y1": 448.46,
"r_x2": 324.57,
"r_y2": 440.45,
"r_x3": 308.86,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.93,
"r_y0": 448.46,
"r_x1": 545.11,
"r_y1": 448.46,
"r_x2": 545.11,
"r_y2": 440.45,
"r_x3": 326.93,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 459.42,
"r_x1": 545.11,
"r_y1": 459.42,
"r_x2": 545.11,
"r_y2": 451.41,
"r_x3": 328.78,
"r_y3": 451.41,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 470.38,
"r_x1": 545.11,
"r_y1": 470.38,
"r_x2": 545.11,
"r_y2": 462.36,
"r_x3": 328.78,
"r_y3": 462.36,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 481.34,
"r_x1": 545.11,
"r_y1": 481.34,
"r_x2": 545.11,
"r_y2": 473.32,
"r_x3": 328.78,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 492.3,
"r_x1": 545.11,
"r_y1": 492.3,
"r_x2": 545.11,
"r_y2": 484.28,
"r_x3": 328.78,
"r_y3": 484.28,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 503.26,
"r_x1": 545.11,
"r_y1": 503.26,
"r_x2": 545.11,
"r_y2": 495.24,
"r_x3": 328.78,
"r_y3": 495.24,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 514.22,
"r_x1": 545.11,
"r_y1": 514.22,
"r_x2": 545.11,
"r_y2": 506.2,
"r_x3": 328.78,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 525.17,
"r_x1": 545.11,
"r_y1": 525.17,
"r_x2": 545.11,
"r_y2": 517.16,
"r_x3": 328.78,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 536.13,
"r_x1": 434.57,
"r_y1": 536.13,
"r_x2": 434.57,
"r_y2": 528.12,
"r_x3": 328.78,
"r_y3": 528.12,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.86,
"r_y0": 535.93,
"r_x1": 545.11,
"r_y1": 535.93,
"r_x2": 545.11,
"r_y2": 528.2,
"r_x3": 437.86,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 546.89,
"r_x1": 425.73,
"r_y1": 546.89,
"r_x2": 425.73,
"r_y2": 539.16,
"r_x3": 328.78,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.74,
"r_y0": 547.09,
"r_x1": 545.11,
"r_y1": 547.09,
"r_x2": 545.11,
"r_y2": 539.08,
"r_x3": 425.74,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 558.05,
"r_x1": 399.74,
"r_y1": 558.05,
"r_x2": 399.74,
"r_y2": 550.03,
"r_x3": 328.78,
"r_y3": 550.03,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"
},
{
"label": "list_item",
"id": 19,
"page_no": 8,
"cluster": {
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 561.48,
"r": 545.11,
"b": 624.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.48,
"r_x3": 308.86,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.85,
"r_y0": 569.5,
"r_x1": 545.11,
"r_y1": 569.5,
"r_x2": 545.11,
"r_y2": 561.48,
"r_x3": 326.85,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 580.46,
"r_x1": 545.11,
"r_y1": 580.46,
"r_x2": 545.11,
"r_y2": 572.44,
"r_x3": 328.78,
"r_y3": 572.44,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 591.41,
"r_x1": 545.11,
"r_y1": 591.41,
"r_x2": 545.11,
"r_y2": 583.4,
"r_x3": 328.78,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 602.37,
"r_x1": 431.62,
"r_y1": 602.37,
"r_x2": 431.62,
"r_y2": 594.36,
"r_x3": 328.78,
"r_y3": 594.36,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.69,
"r_y0": 602.17,
"r_x1": 545.11,
"r_y1": 602.17,
"r_x2": 545.11,
"r_y2": 594.44,
"r_x3": 434.69,
"r_y3": 594.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 613.13,
"r_x1": 545.11,
"r_y1": 613.13,
"r_x2": 545.11,
"r_y2": 605.4,
"r_x3": 328.78,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 624.08,
"r_x1": 367.8,
"r_y1": 624.08,
"r_x2": 367.8,
"r_y2": 616.36,
"r_x3": 328.78,
"r_y3": 616.36,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.29,
"r_x1": 458.69,
"r_y1": 624.29,
"r_x2": 458.69,
"r_y2": 616.28,
"r_x3": 367.8,
"r_y3": 616.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"
},
{
"label": "list_item",
"id": 23,
"page_no": 8,
"cluster": {
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 627.72,
"r": 545.12,
"b": 668.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 635.74,
"r_x1": 324.69,
"r_y1": 635.74,
"r_x2": 324.69,
"r_y2": 627.72,
"r_x3": 308.86,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.07,
"r_y0": 635.74,
"r_x1": 545.11,
"r_y1": 635.74,
"r_x2": 545.11,
"r_y2": 627.72,
"r_x3": 327.07,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 646.7,
"r_x1": 545.11,
"r_y1": 646.7,
"r_x2": 545.11,
"r_y2": 638.68,
"r_x3": 328.78,
"r_y3": 638.68,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 657.65,
"r_x1": 336.25,
"r_y1": 657.65,
"r_x2": 336.25,
"r_y2": 649.64,
"r_x3": 328.78,
"r_y3": 649.64,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.45,
"r_x1": 545.12,
"r_y1": 657.45,
"r_x2": 545.12,
"r_y2": 649.72,
"r_x3": 338.1,
"r_y3": 649.72,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 668.41,
"r_x1": 406.32,
"r_y1": 668.41,
"r_x2": 406.32,
"r_y2": 660.68,
"r_x3": 328.78,
"r_y3": 660.68,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 668.61,
"r_x1": 521.12,
"r_y1": 668.61,
"r_x2": 521.12,
"r_y2": 660.6,
"r_x3": 406.32,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 24,
"page_no": 8,
"cluster": {
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 672.04,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.865,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 680.06,
"r_x1": 324.71,
"r_y1": 680.06,
"r_x2": 324.71,
"r_y2": 672.04,
"r_x3": 308.86,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.09,
"r_y0": 680.06,
"r_x1": 545.11,
"r_y1": 680.06,
"r_x2": 545.11,
"r_y2": 672.04,
"r_x3": 327.09,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 691.02,
"r_x1": 482.81,
"r_y1": 691.02,
"r_x2": 482.81,
"r_y2": 683.0,
"r_x3": 328.78,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.75,
"r_y0": 691.02,
"r_x1": 545.11,
"r_y1": 691.02,
"r_x2": 545.11,
"r_y2": 683.0,
"r_x3": 488.75,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 328.78,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 379.15,
"r_y1": 712.94,
"r_x2": 379.15,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.62,
"r_y0": 712.73,
"r_x1": 545.11,
"r_y1": 712.73,
"r_x2": 545.11,
"r_y2": 705.0,
"r_x3": 381.62,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"
},
{
"label": "page_footer",
"id": 22,
"page_no": 8,
"cluster": {
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9"
}
],
"body": [
{
"label": "list_item",
"id": 25,
"page_no": 8,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.731,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 70.03,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 286.36,
"r_y1": 94.86,
"r_x2": 286.36,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 105.82,
"r_x1": 85.72,
"r_y1": 105.82,
"r_x2": 85.72,
"r_y2": 97.8,
"r_x3": 70.03,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.89,
"r_y0": 105.61,
"r_x1": 199.93,
"r_y1": 105.61,
"r_x2": 199.93,
"r_y2": 97.88,
"r_x3": 87.89,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.94,
"r_y0": 105.82,
"r_x1": 286.36,
"r_y1": 105.82,
"r_x2": 286.36,
"r_y2": 97.8,
"r_x3": 199.94,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 116.78,
"r_x1": 221.95,
"r_y1": 116.78,
"r_x2": 221.95,
"r_y2": 108.76,
"r_x3": 70.03,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"
},
{
"label": "list_item",
"id": 9,
"page_no": 8,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.03,
"r": 286.36,
"b": 149.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.05,
"r_x1": 65.21,
"r_y1": 128.05,
"r_x2": 65.21,
"r_y2": 120.03,
"r_x3": 54.6,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.48,
"r_y0": 128.05,
"r_x1": 286.36,
"r_y1": 128.05,
"r_x2": 286.36,
"r_y2": 120.03,
"r_x3": 67.48,
"r_y3": 120.03,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.01,
"r_x1": 179.67,
"r_y1": 139.01,
"r_x2": 179.67,
"r_y2": 130.99,
"r_x3": 70.03,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 139.01,
"r_x1": 286.36,
"r_y1": 139.01,
"r_x2": 286.36,
"r_y2": 130.99,
"r_x3": 185.58,
"r_y3": 130.99,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.97,
"r_x1": 113.11,
"r_y1": 149.97,
"r_x2": 113.11,
"r_y2": 141.95,
"r_x3": 70.03,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.34,
"r_y0": 149.76,
"r_x1": 235.31,
"r_y1": 149.76,
"r_x2": 235.31,
"r_y2": 142.03,
"r_x3": 116.34,
"r_y3": 142.03,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.31,
"r_y0": 149.97,
"r_x1": 267.68,
"r_y1": 149.97,
"r_x2": 267.68,
"r_y2": 141.95,
"r_x3": 235.31,
"r_y3": 141.95,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"
},
{
"label": "list_item",
"id": 7,
"page_no": 8,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.22,
"r": 286.36,
"b": 183.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.938,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.24,
"r_x1": 65.1,
"r_y1": 161.24,
"r_x2": 65.1,
"r_y2": 153.22,
"r_x3": 54.6,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.36,
"r_y0": 161.24,
"r_x1": 218.78,
"r_y1": 161.24,
"r_x2": 218.78,
"r_y2": 153.22,
"r_x3": 67.36,
"r_y3": 153.22,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.98,
"r_y0": 161.03,
"r_x1": 286.36,
"r_y1": 161.03,
"r_x2": 286.36,
"r_y2": 153.3,
"r_x3": 220.98,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 171.99,
"r_x1": 125.26,
"r_y1": 171.99,
"r_x2": 125.26,
"r_y2": 164.26,
"r_x3": 70.03,
"r_y3": 164.26,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.26,
"r_y0": 172.2,
"r_x1": 286.36,
"r_y1": 172.2,
"r_x2": 286.36,
"r_y2": 164.18,
"r_x3": 125.26,
"r_y3": 164.18,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.15,
"r_x1": 97.92,
"r_y1": 183.15,
"r_x2": 97.92,
"r_y2": 175.14,
"r_x3": 70.03,
"r_y3": 175.14,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"
},
{
"label": "list_item",
"id": 0,
"page_no": 8,
"cluster": {
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 186.41,
"r": 286.36,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 194.43,
"r_x1": 65.81,
"r_y1": 194.43,
"r_x2": 65.81,
"r_y2": 186.41,
"r_x3": 54.59,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.21,
"r_y0": 194.43,
"r_x1": 286.36,
"r_y1": 194.43,
"r_x2": 286.36,
"r_y2": 186.41,
"r_x3": 68.21,
"r_y3": 186.41,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.39,
"r_x1": 286.36,
"r_y1": 205.39,
"r_x2": 286.36,
"r_y2": 197.37,
"r_x3": 70.03,
"r_y3": 197.37,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 216.34,
"r_x1": 286.36,
"r_y1": 216.34,
"r_x2": 286.36,
"r_y2": 208.33,
"r_x3": 70.03,
"r_y3": 208.33,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.3,
"r_x1": 245.84,
"r_y1": 227.3,
"r_x2": 245.84,
"r_y2": 219.29,
"r_x3": 70.03,
"r_y3": 219.29,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"
},
{
"label": "list_item",
"id": 1,
"page_no": 8,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 230.56,
"r": 286.36,
"b": 271.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 238.58,
"r_x1": 65.38,
"r_y1": 238.58,
"r_x2": 65.38,
"r_y2": 230.56,
"r_x3": 54.59,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 238.58,
"r_x1": 286.36,
"r_y1": 238.58,
"r_x2": 286.36,
"r_y2": 230.56,
"r_x3": 67.69,
"r_y3": 230.56,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.53,
"r_x1": 286.36,
"r_y1": 249.53,
"r_x2": 286.36,
"r_y2": 241.52,
"r_x3": 70.03,
"r_y3": 241.52,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.49,
"r_x1": 108.4,
"r_y1": 260.49,
"r_x2": 108.4,
"r_y2": 252.48,
"r_x3": 70.03,
"r_y3": 252.48,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.64,
"r_y0": 260.29,
"r_x1": 286.36,
"r_y1": 260.29,
"r_x2": 286.36,
"r_y2": 252.56,
"r_x3": 110.64,
"r_y3": 252.56,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.25,
"r_x1": 140.58,
"r_y1": 271.25,
"r_x2": 140.58,
"r_y2": 263.52,
"r_x3": 70.03,
"r_y3": 263.52,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.58,
"r_y0": 271.45,
"r_x1": 266.48,
"r_y1": 271.45,
"r_x2": 266.48,
"r_y2": 263.44,
"r_x3": 140.58,
"r_y3": 263.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"
},
{
"label": "list_item",
"id": 2,
"page_no": 8,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 274.71,
"r": 286.37,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 282.72,
"r_x1": 64.85,
"r_y1": 282.72,
"r_x2": 64.85,
"r_y2": 274.71,
"r_x3": 54.59,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.05,
"r_y0": 282.72,
"r_x1": 286.37,
"r_y1": 282.72,
"r_x2": 286.37,
"r_y2": 274.71,
"r_x3": 67.05,
"r_y3": 274.71,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.68,
"r_x1": 179.57,
"r_y1": 293.68,
"r_x2": 179.57,
"r_y2": 285.67,
"r_x3": 70.03,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.02,
"r_y0": 293.68,
"r_x1": 194.48,
"r_y1": 293.68,
"r_x2": 194.48,
"r_y2": 285.67,
"r_x3": 187.02,
"r_y3": 285.67,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.04,
"r_y0": 293.48,
"r_x1": 286.36,
"r_y1": 293.48,
"r_x2": 286.36,
"r_y2": 285.75,
"r_x3": 198.04,
"r_y3": 285.75,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.44,
"r_x1": 260.2,
"r_y1": 304.44,
"r_x2": 260.2,
"r_y2": 296.71,
"r_x3": 70.03,
"r_y3": 296.71,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.64,
"r_x1": 286.36,
"r_y1": 304.64,
"r_x2": 286.36,
"r_y2": 296.63,
"r_x3": 260.2,
"r_y3": 296.63,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.6,
"r_x1": 142.75,
"r_y1": 315.6,
"r_x2": 142.75,
"r_y2": 307.58,
"r_x3": 70.03,
"r_y3": 307.58,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"
},
{
"label": "list_item",
"id": 4,
"page_no": 8,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 318.86,
"r": 286.36,
"b": 348.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 326.87,
"r_x1": 65.62,
"r_y1": 326.87,
"r_x2": 65.62,
"r_y2": 318.86,
"r_x3": 54.59,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 326.87,
"r_x1": 199.49,
"r_y1": 326.87,
"r_x2": 199.49,
"r_y2": 318.86,
"r_x3": 67.98,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.99,
"r_y0": 326.87,
"r_x1": 286.36,
"r_y1": 326.87,
"r_x2": 286.36,
"r_y2": 318.86,
"r_x3": 206.99,
"r_y3": 318.86,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 337.83,
"r_x1": 176.28,
"r_y1": 337.83,
"r_x2": 176.28,
"r_y2": 329.81,
"r_x3": 70.03,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.83,
"r_x1": 190.07,
"r_y1": 337.83,
"r_x2": 190.07,
"r_y2": 329.81,
"r_x3": 182.6,
"r_y3": 329.81,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.28,
"r_y0": 337.62,
"r_x1": 286.36,
"r_y1": 337.62,
"r_x2": 286.36,
"r_y2": 329.9,
"r_x3": 193.28,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.58,
"r_x1": 206.35,
"r_y1": 348.58,
"r_x2": 206.35,
"r_y2": 340.85,
"r_x3": 70.03,
"r_y3": 340.85,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.35,
"r_y0": 348.79,
"r_x1": 274.82,
"r_y1": 348.79,
"r_x2": 274.82,
"r_y2": 340.77,
"r_x3": 206.35,
"r_y3": 340.77,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"
},
{
"label": "list_item",
"id": 3,
"page_no": 8,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.59,
"t": 352.05,
"r": 286.36,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.948,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.59,
"r_y0": 360.06,
"r_x1": 65.05,
"r_y1": 360.06,
"r_x2": 65.05,
"r_y2": 352.05,
"r_x3": 54.59,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.29,
"r_y0": 360.06,
"r_x1": 286.36,
"r_y1": 360.06,
"r_x2": 286.36,
"r_y2": 352.05,
"r_x3": 67.29,
"r_y3": 352.05,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 371.02,
"r_x1": 234.13,
"r_y1": 371.02,
"r_x2": 234.13,
"r_y2": 363.0,
"r_x3": 70.03,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.05,
"r_y0": 371.02,
"r_x1": 286.36,
"r_y1": 371.02,
"r_x2": 286.36,
"r_y2": 363.0,
"r_x3": 240.05,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.98,
"r_x1": 286.36,
"r_y1": 381.98,
"r_x2": 286.36,
"r_y2": 373.96,
"r_x3": 70.03,
"r_y3": 373.96,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 70.03,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 114.58,
"r_y1": 403.9,
"r_x2": 114.58,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.69,
"r_x1": 186.73,
"r_y1": 403.69,
"r_x2": 186.73,
"r_y2": 395.96,
"r_x3": 117.8,
"r_y3": 395.96,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.73,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.88,
"r_x3": 186.73,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"
},
{
"label": "list_item",
"id": 10,
"page_no": 8,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.15,
"r": 286.36,
"b": 437.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.933,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.17,
"r_x1": 65.33,
"r_y1": 415.17,
"r_x2": 65.33,
"r_y2": 407.15,
"r_x3": 54.6,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.64,
"r_y0": 415.17,
"r_x1": 286.36,
"r_y1": 415.17,
"r_x2": 286.36,
"r_y2": 407.15,
"r_x3": 67.64,
"r_y3": 407.15,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 426.13,
"r_x1": 147.13,
"r_y1": 426.13,
"r_x2": 147.13,
"r_y2": 418.11,
"r_x3": 70.03,
"r_y3": 418.11,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.16,
"r_y0": 425.92,
"r_x1": 286.36,
"r_y1": 425.92,
"r_x2": 286.36,
"r_y2": 418.19,
"r_x3": 149.16,
"r_y3": 418.19,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.88,
"r_x1": 213.48,
"r_y1": 436.88,
"r_x2": 213.48,
"r_y2": 429.15,
"r_x3": 70.03,
"r_y3": 429.15,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.48,
"r_y0": 437.09,
"r_x1": 261.04,
"r_y1": 437.09,
"r_x2": 261.04,
"r_y2": 429.07,
"r_x3": 213.48,
"r_y3": 429.07,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"
},
{
"label": "list_item",
"id": 14,
"page_no": 8,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 440.34,
"r": 286.36,
"b": 481.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.927,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.36,
"r_x1": 65.4,
"r_y1": 448.36,
"r_x2": 65.4,
"r_y2": 440.34,
"r_x3": 50.11,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.69,
"r_y0": 448.36,
"r_x1": 286.36,
"r_y1": 448.36,
"r_x2": 286.36,
"r_y2": 440.34,
"r_x3": 67.69,
"r_y3": 440.34,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 459.32,
"r_x1": 202.74,
"r_y1": 459.32,
"r_x2": 202.74,
"r_y2": 451.3,
"r_x3": 70.03,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.32,
"r_x1": 286.36,
"r_y1": 459.32,
"r_x2": 286.36,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 470.28,
"r_x1": 286.36,
"r_y1": 470.28,
"r_x2": 286.36,
"r_y2": 462.26,
"r_x3": 70.03,
"r_y3": 462.26,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 481.24,
"r_x1": 141.87,
"r_y1": 481.24,
"r_x2": 141.87,
"r_y2": 473.22,
"r_x3": 70.03,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.03,
"r_x1": 166.02,
"r_y1": 481.03,
"r_x2": 166.02,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.01,
"r_y0": 481.24,
"r_x1": 259.9,
"r_y1": 481.24,
"r_x2": 259.9,
"r_y2": 473.22,
"r_x3": 166.01,
"r_y3": 473.22,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"
},
{
"label": "list_item",
"id": 11,
"page_no": 8,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 484.49,
"r": 286.36,
"b": 536.34,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.51,
"r_x1": 66.03,
"r_y1": 492.51,
"r_x2": 66.03,
"r_y2": 484.49,
"r_x3": 50.11,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.42,
"r_y0": 492.51,
"r_x1": 286.36,
"r_y1": 492.51,
"r_x2": 286.36,
"r_y2": 484.49,
"r_x3": 68.42,
"r_y3": 484.49,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 503.47,
"r_x1": 286.36,
"r_y1": 503.47,
"r_x2": 286.36,
"r_y2": 495.45,
"r_x3": 70.03,
"r_y3": 495.45,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 514.22,
"r_x1": 227.41,
"r_y1": 514.22,
"r_x2": 227.41,
"r_y2": 506.49,
"r_x3": 70.03,
"r_y3": 506.49,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.41,
"r_y0": 514.42,
"r_x1": 286.36,
"r_y1": 514.42,
"r_x2": 286.36,
"r_y2": 506.41,
"r_x3": 227.41,
"r_y3": 506.41,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.38,
"r_x1": 286.36,
"r_y1": 525.38,
"r_x2": 286.36,
"r_y2": 517.37,
"r_x3": 70.03,
"r_y3": 517.37,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 536.34,
"r_x1": 112.36,
"r_y1": 536.34,
"r_x2": 112.36,
"r_y2": 528.33,
"r_x3": 70.03,
"r_y3": 528.33,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 8,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 539.6,
"r": 286.36,
"b": 591.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 547.61,
"r_x1": 65.47,
"r_y1": 547.61,
"r_x2": 65.47,
"r_y2": 539.6,
"r_x3": 50.11,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 547.61,
"r_x1": 286.36,
"r_y1": 547.61,
"r_x2": 286.36,
"r_y2": 539.6,
"r_x3": 67.77,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 558.57,
"r_x1": 136.28,
"r_y1": 558.57,
"r_x2": 136.28,
"r_y2": 550.56,
"r_x3": 70.03,
"r_y3": 550.56,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.81,
"r_y0": 558.37,
"r_x1": 286.36,
"r_y1": 558.37,
"r_x2": 286.36,
"r_y2": 550.64,
"r_x3": 138.81,
"r_y3": 550.64,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.33,
"r_x1": 286.36,
"r_y1": 569.33,
"r_x2": 286.36,
"r_y2": 561.6,
"r_x3": 70.03,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.29,
"r_x1": 74.51,
"r_y1": 580.29,
"r_x2": 74.51,
"r_y2": 572.56,
"r_x3": 70.03,
"r_y3": 572.56,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.51,
"r_y0": 580.49,
"r_x1": 286.36,
"r_y1": 580.49,
"r_x2": 286.36,
"r_y2": 572.48,
"r_x3": 74.51,
"r_y3": 572.48,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.45,
"r_x1": 90.36,
"r_y1": 591.45,
"r_x2": 90.36,
"r_y2": 583.43,
"r_x3": 70.03,
"r_y3": 583.43,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"
},
{
"label": "list_item",
"id": 13,
"page_no": 8,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.71,
"r": 286.36,
"b": 646.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.72,
"r_x1": 66.27,
"r_y1": 602.72,
"r_x2": 66.27,
"r_y2": 594.71,
"r_x3": 50.11,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.72,
"r_x1": 286.36,
"r_y1": 602.72,
"r_x2": 286.36,
"r_y2": 594.71,
"r_x3": 68.7,
"r_y3": 594.71,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.68,
"r_x1": 286.36,
"r_y1": 613.68,
"r_x2": 286.36,
"r_y2": 605.66,
"r_x3": 70.03,
"r_y3": 605.66,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.64,
"r_x1": 286.36,
"r_y1": 624.64,
"r_x2": 286.36,
"r_y2": 616.62,
"r_x3": 70.03,
"r_y3": 616.62,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.58,
"r_x3": 70.03,
"r_y3": 627.58,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.92,
"r_y0": 635.39,
"r_x1": 286.36,
"r_y1": 635.39,
"r_x2": 286.36,
"r_y2": 627.66,
"r_x3": 79.92,
"r_y3": 627.66,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 646.35,
"r_x1": 140.68,
"r_y1": 646.35,
"r_x2": 140.68,
"r_y2": 638.62,
"r_x3": 70.03,
"r_y3": 638.62,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.68,
"r_y0": 646.56,
"r_x1": 264.44,
"r_y1": 646.56,
"r_x2": 264.44,
"r_y2": 638.54,
"r_x3": 140.68,
"r_y3": 638.54,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"
},
{
"label": "list_item",
"id": 17,
"page_no": 8,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 649.81,
"r": 286.36,
"b": 679.75,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 657.83,
"r_x1": 66.53,
"r_y1": 657.83,
"r_x2": 66.53,
"r_y2": 649.81,
"r_x3": 50.11,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.83,
"r_x1": 286.36,
"r_y1": 657.83,
"r_x2": 286.36,
"r_y2": 649.81,
"r_x3": 69.0,
"r_y3": 649.81,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.79,
"r_x1": 93.2,
"r_y1": 668.79,
"r_x2": 93.2,
"r_y2": 660.77,
"r_x3": 70.03,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.79,
"r_x1": 286.36,
"r_y1": 668.79,
"r_x2": 286.36,
"r_y2": 660.77,
"r_x3": 102.2,
"r_y3": 660.77,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.75,
"r_x1": 172.0,
"r_y1": 679.75,
"r_x2": 172.0,
"r_y2": 671.73,
"r_x3": 70.03,
"r_y3": 671.73,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"
},
{
"label": "list_item",
"id": 16,
"page_no": 8,
"cluster": {
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 683.0,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.912,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 691.02,
"r_x1": 65.52,
"r_y1": 691.02,
"r_x2": 65.52,
"r_y2": 683.0,
"r_x3": 50.11,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.83,
"r_y0": 691.02,
"r_x1": 286.36,
"r_y1": 691.02,
"r_x2": 286.36,
"r_y2": 683.0,
"r_x3": 67.83,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 701.98,
"r_x1": 102.16,
"r_y1": 701.98,
"r_x2": 102.16,
"r_y2": 693.96,
"r_x3": 70.03,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.55,
"r_y0": 701.77,
"r_x1": 231.47,
"r_y1": 701.77,
"r_x2": 231.47,
"r_y2": 694.04,
"r_x3": 107.55,
"r_y3": 694.04,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.48,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 231.48,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 97.92,
"r_y1": 712.94,
"r_x2": 97.92,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"
},
{
"label": "list_item",
"id": 6,
"page_no": 8,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 75.88,
"r": 545.11,
"b": 138.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 83.9,
"r_x1": 324.75,
"r_y1": 83.9,
"r_x2": 324.75,
"r_y2": 75.88,
"r_x3": 308.86,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.13,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 327.13,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 545.11,
"r_y1": 94.86,
"r_x2": 545.11,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.82,
"r_x1": 390.96,
"r_y1": 105.82,
"r_x2": 390.96,
"r_y2": 97.8,
"r_x3": 328.78,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.27,
"r_y0": 105.82,
"r_x1": 435.14,
"r_y1": 105.82,
"r_x2": 435.14,
"r_y2": 97.8,
"r_x3": 400.27,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.71,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 441.71,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 440.81,
"r_y1": 116.78,
"r_x2": 440.81,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.63,
"r_y0": 116.57,
"r_x1": 545.11,
"r_y1": 116.57,
"r_x2": 545.11,
"r_y2": 108.84,
"r_x3": 446.63,
"r_y3": 108.84,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 127.53,
"r_x1": 471.13,
"r_y1": 127.53,
"r_x2": 471.13,
"r_y2": 119.8,
"r_x3": 328.78,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.13,
"r_y0": 127.73,
"r_x1": 545.11,
"r_y1": 127.73,
"r_x2": 545.11,
"r_y2": 119.72,
"r_x3": 471.13,
"r_y3": 119.72,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 138.69,
"r_x1": 356.67,
"r_y1": 138.69,
"r_x2": 356.67,
"r_y2": 130.68,
"r_x3": 328.78,
"r_y3": 130.68,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"
},
{
"label": "list_item",
"id": 15,
"page_no": 8,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 142.12,
"r": 545.11,
"b": 172.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.925,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 150.14,
"r_x1": 325.24,
"r_y1": 150.14,
"r_x2": 325.24,
"r_y2": 142.12,
"r_x3": 308.86,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.14,
"r_x1": 545.11,
"r_y1": 150.14,
"r_x2": 545.11,
"r_y2": 142.12,
"r_x3": 327.7,
"r_y3": 142.12,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.1,
"r_x1": 414.45,
"r_y1": 161.1,
"r_x2": 414.45,
"r_y2": 153.08,
"r_x3": 328.78,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.83,
"r_y0": 161.1,
"r_x1": 545.11,
"r_y1": 161.1,
"r_x2": 545.11,
"r_y2": 153.08,
"r_x3": 421.83,
"r_y3": 153.08,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 172.06,
"r_x1": 493.63,
"r_y1": 172.06,
"r_x2": 493.63,
"r_y2": 164.04,
"r_x3": 328.78,
"r_y3": 164.04,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"
},
{
"label": "list_item",
"id": 12,
"page_no": 8,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 175.49,
"r": 545.11,
"b": 260.21,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.5,
"r_x1": 324.27,
"r_y1": 183.5,
"r_x2": 324.27,
"r_y2": 175.49,
"r_x3": 308.86,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 183.5,
"r_x1": 545.11,
"r_y1": 183.5,
"r_x2": 545.11,
"r_y2": 175.49,
"r_x3": 326.58,
"r_y3": 175.49,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 194.46,
"r_x1": 545.11,
"r_y1": 194.46,
"r_x2": 545.11,
"r_y2": 186.45,
"r_x3": 328.78,
"r_y3": 186.45,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 205.42,
"r_x1": 545.11,
"r_y1": 205.42,
"r_x2": 545.11,
"r_y2": 197.4,
"r_x3": 328.78,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 216.38,
"r_x1": 545.11,
"r_y1": 216.38,
"r_x2": 545.11,
"r_y2": 208.36,
"r_x3": 328.78,
"r_y3": 208.36,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 227.34,
"r_x1": 479.26,
"r_y1": 227.34,
"r_x2": 479.26,
"r_y2": 219.32,
"r_x3": 328.78,
"r_y3": 219.32,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.12,
"r_y0": 227.13,
"r_x1": 545.11,
"r_y1": 227.13,
"r_x2": 545.11,
"r_y2": 219.4,
"r_x3": 483.12,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 238.09,
"r_x1": 519.4,
"r_y1": 238.09,
"r_x2": 519.4,
"r_y2": 230.36,
"r_x3": 328.78,
"r_y3": 230.36,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.11,
"r_y1": 238.3,
"r_x2": 545.11,
"r_y2": 230.28,
"r_x3": 519.4,
"r_y3": 230.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 249.26,
"r_x1": 545.11,
"r_y1": 249.26,
"r_x2": 545.11,
"r_y2": 241.24,
"r_x3": 328.78,
"r_y3": 241.24,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 260.21,
"r_x1": 333.26,
"r_y1": 260.21,
"r_x2": 333.26,
"r_y2": 252.2,
"r_x3": 328.78,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 8,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 263.64,
"r": 545.11,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.937,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 271.66,
"r_x1": 324.26,
"r_y1": 271.66,
"r_x2": 324.26,
"r_y2": 263.64,
"r_x3": 308.86,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.58,
"r_y0": 271.66,
"r_x1": 545.11,
"r_y1": 271.66,
"r_x2": 545.11,
"r_y2": 263.64,
"r_x3": 326.58,
"r_y3": 263.64,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 282.62,
"r_x1": 545.11,
"r_y1": 282.62,
"r_x2": 545.11,
"r_y2": 274.6,
"r_x3": 328.78,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 293.58,
"r_x1": 545.11,
"r_y1": 293.58,
"r_x2": 545.11,
"r_y2": 285.56,
"r_x3": 328.78,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 304.54,
"r_x1": 545.11,
"r_y1": 304.54,
"r_x2": 545.11,
"r_y2": 296.52,
"r_x3": 328.78,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 315.5,
"r_x1": 352.85,
"r_y1": 315.5,
"r_x2": 352.85,
"r_y2": 307.48,
"r_x3": 328.78,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.24,
"r_y0": 315.29,
"r_x1": 545.11,
"r_y1": 315.29,
"r_x2": 545.11,
"r_y2": 307.56,
"r_x3": 360.24,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 326.25,
"r_x1": 371.02,
"r_y1": 326.25,
"r_x2": 371.02,
"r_y2": 318.52,
"r_x3": 328.78,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.02,
"r_y0": 326.45,
"r_x1": 502.26,
"r_y1": 326.45,
"r_x2": 502.26,
"r_y2": 318.44,
"r_x3": 371.02,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"
},
{
"label": "list_item",
"id": 18,
"page_no": 8,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 329.88,
"r": 545.12,
"b": 370.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 337.9,
"r_x1": 323.83,
"r_y1": 337.9,
"r_x2": 323.83,
"r_y2": 329.88,
"r_x3": 308.86,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.07,
"r_y0": 337.9,
"r_x1": 545.11,
"r_y1": 337.9,
"r_x2": 545.11,
"r_y2": 329.88,
"r_x3": 326.07,
"r_y3": 329.88,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 348.86,
"r_x1": 545.11,
"r_y1": 348.86,
"r_x2": 545.11,
"r_y2": 340.84,
"r_x3": 328.78,
"r_y3": 340.84,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 359.82,
"r_x1": 382.78,
"r_y1": 359.82,
"r_x2": 382.78,
"r_y2": 351.8,
"r_x3": 328.78,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.54,
"r_y0": 359.61,
"r_x1": 545.12,
"r_y1": 359.61,
"r_x2": 545.12,
"r_y2": 351.88,
"r_x3": 385.54,
"r_y3": 351.88,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 370.57,
"r_x1": 443.6,
"r_y1": 370.57,
"r_x2": 443.6,
"r_y2": 362.84,
"r_x3": 328.78,
"r_y3": 362.84,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.59,
"r_y0": 370.78,
"r_x1": 534.49,
"r_y1": 370.78,
"r_x2": 534.49,
"r_y2": 362.76,
"r_x3": 443.59,
"r_y3": 362.76,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"
},
{
"label": "list_item",
"id": 21,
"page_no": 8,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 374.21,
"r": 545.11,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 382.22,
"r_x1": 324.6,
"r_y1": 382.22,
"r_x2": 324.6,
"r_y2": 374.21,
"r_x3": 308.86,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.96,
"r_y0": 382.22,
"r_x1": 362.66,
"r_y1": 382.22,
"r_x2": 362.66,
"r_y2": 374.21,
"r_x3": 326.96,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.69,
"r_y0": 382.22,
"r_x1": 389.61,
"r_y1": 382.22,
"r_x2": 389.61,
"r_y2": 374.21,
"r_x3": 368.69,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.65,
"r_y0": 382.22,
"r_x1": 424.56,
"r_y1": 382.22,
"r_x2": 424.56,
"r_y2": 374.21,
"r_x3": 395.65,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.55,
"r_y0": 382.22,
"r_x1": 438.02,
"r_y1": 382.22,
"r_x2": 438.02,
"r_y2": 374.21,
"r_x3": 431.55,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.06,
"r_y0": 382.22,
"r_x1": 488.5,
"r_y1": 382.22,
"r_x2": 488.5,
"r_y2": 374.21,
"r_x3": 444.06,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.48,
"r_y0": 382.22,
"r_x1": 515.41,
"r_y1": 382.22,
"r_x2": 515.41,
"r_y2": 374.21,
"r_x3": 495.48,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.45,
"r_y0": 382.22,
"r_x1": 545.11,
"r_y1": 382.22,
"r_x2": 545.11,
"r_y2": 374.21,
"r_x3": 521.45,
"r_y3": 374.21,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 393.18,
"r_x1": 545.11,
"r_y1": 393.18,
"r_x2": 545.11,
"r_y2": 385.17,
"r_x3": 328.78,
"r_y3": 385.17,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 404.14,
"r_x1": 545.11,
"r_y1": 404.14,
"r_x2": 545.11,
"r_y2": 396.12,
"r_x3": 328.78,
"r_y3": 396.12,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 415.1,
"r_x1": 478.01,
"r_y1": 415.1,
"r_x2": 478.01,
"r_y2": 407.08,
"r_x3": 328.78,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.07,
"r_y0": 415.1,
"r_x1": 491.54,
"r_y1": 415.1,
"r_x2": 491.54,
"r_y2": 407.08,
"r_x3": 484.07,
"r_y3": 407.08,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.67,
"r_y0": 414.89,
"r_x1": 545.11,
"r_y1": 414.89,
"r_x2": 545.11,
"r_y2": 407.16,
"r_x3": 494.67,
"r_y3": 407.16,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 425.85,
"r_x1": 545.11,
"r_y1": 425.85,
"r_x2": 545.11,
"r_y2": 418.12,
"r_x3": 328.78,
"r_y3": 418.12,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 436.81,
"r_x1": 360.84,
"r_y1": 436.81,
"r_x2": 360.84,
"r_y2": 429.08,
"r_x3": 328.78,
"r_y3": 429.08,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.84,
"r_y0": 437.02,
"r_x1": 475.63,
"r_y1": 437.02,
"r_x2": 475.63,
"r_y2": 429.0,
"r_x3": 360.84,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"
},
{
"label": "list_item",
"id": 20,
"page_no": 8,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 440.45,
"r": 545.11,
"b": 558.05,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.46,
"r_x1": 324.57,
"r_y1": 448.46,
"r_x2": 324.57,
"r_y2": 440.45,
"r_x3": 308.86,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.93,
"r_y0": 448.46,
"r_x1": 545.11,
"r_y1": 448.46,
"r_x2": 545.11,
"r_y2": 440.45,
"r_x3": 326.93,
"r_y3": 440.45,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 459.42,
"r_x1": 545.11,
"r_y1": 459.42,
"r_x2": 545.11,
"r_y2": 451.41,
"r_x3": 328.78,
"r_y3": 451.41,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 470.38,
"r_x1": 545.11,
"r_y1": 470.38,
"r_x2": 545.11,
"r_y2": 462.36,
"r_x3": 328.78,
"r_y3": 462.36,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 481.34,
"r_x1": 545.11,
"r_y1": 481.34,
"r_x2": 545.11,
"r_y2": 473.32,
"r_x3": 328.78,
"r_y3": 473.32,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 492.3,
"r_x1": 545.11,
"r_y1": 492.3,
"r_x2": 545.11,
"r_y2": 484.28,
"r_x3": 328.78,
"r_y3": 484.28,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 503.26,
"r_x1": 545.11,
"r_y1": 503.26,
"r_x2": 545.11,
"r_y2": 495.24,
"r_x3": 328.78,
"r_y3": 495.24,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 514.22,
"r_x1": 545.11,
"r_y1": 514.22,
"r_x2": 545.11,
"r_y2": 506.2,
"r_x3": 328.78,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 525.17,
"r_x1": 545.11,
"r_y1": 525.17,
"r_x2": 545.11,
"r_y2": 517.16,
"r_x3": 328.78,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 536.13,
"r_x1": 434.57,
"r_y1": 536.13,
"r_x2": 434.57,
"r_y2": 528.12,
"r_x3": 328.78,
"r_y3": 528.12,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.86,
"r_y0": 535.93,
"r_x1": 545.11,
"r_y1": 535.93,
"r_x2": 545.11,
"r_y2": 528.2,
"r_x3": 437.86,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 546.89,
"r_x1": 425.73,
"r_y1": 546.89,
"r_x2": 425.73,
"r_y2": 539.16,
"r_x3": 328.78,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.74,
"r_y0": 547.09,
"r_x1": 545.11,
"r_y1": 547.09,
"r_x2": 545.11,
"r_y2": 539.08,
"r_x3": 425.74,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 558.05,
"r_x1": 399.74,
"r_y1": 558.05,
"r_x2": 399.74,
"r_y2": 550.03,
"r_x3": 328.78,
"r_y3": 550.03,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"
},
{
"label": "list_item",
"id": 19,
"page_no": 8,
"cluster": {
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 561.48,
"r": 545.11,
"b": 624.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.903,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.48,
"r_x3": 308.86,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.85,
"r_y0": 569.5,
"r_x1": 545.11,
"r_y1": 569.5,
"r_x2": 545.11,
"r_y2": 561.48,
"r_x3": 326.85,
"r_y3": 561.48,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 580.46,
"r_x1": 545.11,
"r_y1": 580.46,
"r_x2": 545.11,
"r_y2": 572.44,
"r_x3": 328.78,
"r_y3": 572.44,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 591.41,
"r_x1": 545.11,
"r_y1": 591.41,
"r_x2": 545.11,
"r_y2": 583.4,
"r_x3": 328.78,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 602.37,
"r_x1": 431.62,
"r_y1": 602.37,
"r_x2": 431.62,
"r_y2": 594.36,
"r_x3": 328.78,
"r_y3": 594.36,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.69,
"r_y0": 602.17,
"r_x1": 545.11,
"r_y1": 602.17,
"r_x2": 545.11,
"r_y2": 594.44,
"r_x3": 434.69,
"r_y3": 594.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 613.13,
"r_x1": 545.11,
"r_y1": 613.13,
"r_x2": 545.11,
"r_y2": 605.4,
"r_x3": 328.78,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 624.08,
"r_x1": 367.8,
"r_y1": 624.08,
"r_x2": 367.8,
"r_y2": 616.36,
"r_x3": 328.78,
"r_y3": 616.36,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.29,
"r_x1": 458.69,
"r_y1": 624.29,
"r_x2": 458.69,
"r_y2": 616.28,
"r_x3": 367.8,
"r_y3": 616.28,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"
},
{
"label": "list_item",
"id": 23,
"page_no": 8,
"cluster": {
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 627.72,
"r": 545.12,
"b": 668.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.878,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 635.74,
"r_x1": 324.69,
"r_y1": 635.74,
"r_x2": 324.69,
"r_y2": 627.72,
"r_x3": 308.86,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.07,
"r_y0": 635.74,
"r_x1": 545.11,
"r_y1": 635.74,
"r_x2": 545.11,
"r_y2": 627.72,
"r_x3": 327.07,
"r_y3": 627.72,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 646.7,
"r_x1": 545.11,
"r_y1": 646.7,
"r_x2": 545.11,
"r_y2": 638.68,
"r_x3": 328.78,
"r_y3": 638.68,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 657.65,
"r_x1": 336.25,
"r_y1": 657.65,
"r_x2": 336.25,
"r_y2": 649.64,
"r_x3": 328.78,
"r_y3": 649.64,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.45,
"r_x1": 545.12,
"r_y1": 657.45,
"r_x2": 545.12,
"r_y2": 649.72,
"r_x3": 338.1,
"r_y3": 649.72,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 668.41,
"r_x1": 406.32,
"r_y1": 668.41,
"r_x2": 406.32,
"r_y2": 660.68,
"r_x3": 328.78,
"r_y3": 660.68,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 668.61,
"r_x1": 521.12,
"r_y1": 668.61,
"r_x2": 521.12,
"r_y2": 660.6,
"r_x3": 406.32,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 24,
"page_no": 8,
"cluster": {
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 672.04,
"r": 545.11,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.865,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 680.06,
"r_x1": 324.71,
"r_y1": 680.06,
"r_x2": 324.71,
"r_y2": 672.04,
"r_x3": 308.86,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.09,
"r_y0": 680.06,
"r_x1": 545.11,
"r_y1": 680.06,
"r_x2": 545.11,
"r_y2": 672.04,
"r_x3": 327.09,
"r_y3": 672.04,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 691.02,
"r_x1": 482.81,
"r_y1": 691.02,
"r_x2": 482.81,
"r_y2": 683.0,
"r_x3": 328.78,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.75,
"r_y0": 691.02,
"r_x1": 545.11,
"r_y1": 691.02,
"r_x2": 545.11,
"r_y2": 683.0,
"r_x3": 488.75,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 701.98,
"r_x1": 545.11,
"r_y1": 701.98,
"r_x2": 545.11,
"r_y2": 693.96,
"r_x3": 328.78,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 712.94,
"r_x1": 379.15,
"r_y1": 712.94,
"r_x2": 379.15,
"r_y2": 704.92,
"r_x3": 328.78,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.62,
"r_y0": 712.73,
"r_x1": 545.11,
"r_y1": 712.73,
"r_x2": 545.11,
"r_y2": 705.0,
"r_x3": 381.62,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"
}
],
"headers": [
{
"label": "page_footer",
"id": 22,
"page_no": 8,
"cluster": {
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.12,
"t": 734.13,
"r": 300.1,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.12,
"r_y0": 743.04,
"r_x1": 300.1,
"r_y1": 743.04,
"r_x2": 300.1,
"r_y2": 734.13,
"r_x3": 295.12,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9"
}
]
}
},
{
"page_no": 9,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.69,
"r_x1": 223.58,
"r_y1": 83.69,
"r_x2": 223.58,
"r_y2": 75.96,
"r_x3": 70.03,
"r_y3": 75.96,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.58,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 223.58,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 97.92,
"r_y1": 94.86,
"r_x2": 97.92,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 106.18,
"r_x1": 65.53,
"r_y1": 106.18,
"r_x2": 65.53,
"r_y2": 98.17,
"r_x3": 50.11,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 106.18,
"r_x1": 286.36,
"r_y1": 106.18,
"r_x2": 286.36,
"r_y2": 98.17,
"r_x3": 67.85,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 117.14,
"r_x1": 286.36,
"r_y1": 117.14,
"r_x2": 286.36,
"r_y2": 109.12,
"r_x3": 70.03,
"r_y3": 109.12,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 128.1,
"r_x1": 286.36,
"r_y1": 128.1,
"r_x2": 286.36,
"r_y2": 120.08,
"r_x3": 70.03,
"r_y3": 120.08,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.06,
"r_x1": 77.5,
"r_y1": 139.06,
"r_x2": 77.5,
"r_y2": 131.04,
"r_x3": 70.03,
"r_y3": 131.04,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.56,
"r_y0": 138.85,
"r_x1": 286.37,
"r_y1": 138.85,
"r_x2": 286.37,
"r_y2": 131.12,
"r_x3": 80.56,
"r_y3": 131.12,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.81,
"r_x1": 195.23,
"r_y1": 149.81,
"r_x2": 195.23,
"r_y2": 142.08,
"r_x3": 70.03,
"r_y3": 142.08,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.23,
"r_y0": 150.02,
"r_x1": 286.37,
"r_y1": 150.02,
"r_x2": 286.37,
"r_y2": 142.0,
"r_x3": 195.23,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 160.98,
"r_x1": 120.33,
"r_y1": 160.98,
"r_x2": 120.33,
"r_y2": 152.96,
"r_x3": 70.03,
"r_y3": 152.96,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 172.3,
"r_x1": 65.53,
"r_y1": 172.3,
"r_x2": 65.53,
"r_y2": 164.28,
"r_x3": 50.11,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 172.3,
"r_x1": 286.36,
"r_y1": 172.3,
"r_x2": 286.36,
"r_y2": 164.28,
"r_x3": 67.85,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.26,
"r_x1": 286.36,
"r_y1": 183.26,
"r_x2": 286.36,
"r_y2": 175.24,
"r_x3": 70.03,
"r_y3": 175.24,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 194.22,
"r_x1": 286.36,
"r_y1": 194.22,
"r_x2": 286.36,
"r_y2": 186.2,
"r_x3": 70.03,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.18,
"r_x1": 101.33,
"r_y1": 205.18,
"r_x2": 101.33,
"r_y2": 197.16,
"r_x3": 70.03,
"r_y3": 197.16,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.33,
"r_y0": 204.97,
"r_x1": 286.36,
"r_y1": 204.97,
"r_x2": 286.36,
"r_y2": 197.24,
"r_x3": 104.33,
"r_y3": 197.24,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 215.93,
"r_x1": 220.49,
"r_y1": 215.93,
"r_x2": 220.49,
"r_y2": 208.2,
"r_x3": 70.03,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.48,
"r_y0": 216.14,
"r_x1": 286.36,
"r_y1": 216.14,
"r_x2": 286.36,
"r_y2": 208.12,
"r_x3": 220.48,
"r_y3": 208.12,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.09,
"r_x1": 166.65,
"r_y1": 227.09,
"r_x2": 166.65,
"r_y2": 219.08,
"r_x3": 70.03,
"r_y3": 219.08,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 238.42,
"r_x1": 65.65,
"r_y1": 238.42,
"r_x2": 65.65,
"r_y2": 230.4,
"r_x3": 50.11,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 238.42,
"r_x1": 286.36,
"r_y1": 238.42,
"r_x2": 286.36,
"r_y2": 230.4,
"r_x3": 67.98,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.38,
"r_x1": 147.17,
"r_y1": 249.38,
"r_x2": 147.17,
"r_y2": 241.36,
"r_x3": 70.03,
"r_y3": 241.36,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.93,
"r_y0": 249.17,
"r_x1": 286.37,
"r_y1": 249.17,
"r_x2": 286.37,
"r_y2": 241.44,
"r_x3": 149.93,
"r_y3": 241.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.13,
"r_x1": 244.69,
"r_y1": 260.13,
"r_x2": 244.69,
"r_y2": 252.4,
"r_x3": 70.03,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.69,
"r_y0": 260.34,
"r_x1": 286.36,
"r_y1": 260.34,
"r_x2": 286.36,
"r_y2": 252.32,
"r_x3": 244.69,
"r_y3": 252.32,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.3,
"r_x1": 111.37,
"r_y1": 271.3,
"r_x2": 111.37,
"r_y2": 263.28,
"r_x3": 70.03,
"r_y3": 263.28,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 282.62,
"r_x1": 66.02,
"r_y1": 282.62,
"r_x2": 66.02,
"r_y2": 274.6,
"r_x3": 50.11,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.41,
"r_y0": 282.62,
"r_x1": 94.94,
"r_y1": 282.62,
"r_x2": 94.94,
"r_y2": 274.6,
"r_x3": 68.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.87,
"r_y0": 282.62,
"r_x1": 127.27,
"r_y1": 282.62,
"r_x2": 127.27,
"r_y2": 274.6,
"r_x3": 100.87,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.19,
"r_y0": 282.62,
"r_x1": 165.83,
"r_y1": 282.62,
"r_x2": 165.83,
"r_y2": 274.6,
"r_x3": 133.19,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.68,
"r_y0": 282.62,
"r_x1": 194.09,
"r_y1": 282.62,
"r_x2": 194.09,
"r_y2": 274.6,
"r_x3": 172.68,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.02,
"r_y0": 282.62,
"r_x1": 211.48,
"r_y1": 282.62,
"r_x2": 211.48,
"r_y2": 274.6,
"r_x3": 200.02,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.41,
"r_y0": 282.62,
"r_x1": 239.44,
"r_y1": 282.62,
"r_x2": 239.44,
"r_y2": 274.6,
"r_x3": 217.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 282.62,
"r_x1": 264.22,
"r_y1": 282.62,
"r_x2": 264.22,
"r_y2": 274.6,
"r_x3": 246.29,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.15,
"r_y0": 282.62,
"r_x1": 286.36,
"r_y1": 282.62,
"r_x2": 286.36,
"r_y2": 274.6,
"r_x3": 270.15,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.58,
"r_x1": 286.36,
"r_y1": 293.58,
"r_x2": 286.36,
"r_y2": 285.56,
"r_x3": 70.03,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.54,
"r_x1": 286.36,
"r_y1": 304.54,
"r_x2": 286.36,
"r_y2": 296.52,
"r_x3": 70.03,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.48,
"r_x3": 70.03,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.35,
"r_y0": 315.29,
"r_x1": 286.37,
"r_y1": 315.29,
"r_x2": 286.37,
"r_y2": 307.56,
"r_x3": 79.35,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 326.25,
"r_x1": 147.57,
"r_y1": 326.25,
"r_x2": 147.57,
"r_y2": 318.52,
"r_x3": 70.03,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.57,
"r_y0": 326.45,
"r_x1": 271.34,
"r_y1": 326.45,
"r_x2": 271.34,
"r_y2": 318.44,
"r_x3": 147.57,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 337.78,
"r_x1": 65.37,
"r_y1": 337.78,
"r_x2": 65.37,
"r_y2": 329.76,
"r_x3": 50.11,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.66,
"r_y0": 337.78,
"r_x1": 286.36,
"r_y1": 337.78,
"r_x2": 286.36,
"r_y2": 329.76,
"r_x3": 67.66,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.74,
"r_x1": 286.36,
"r_y1": 348.74,
"r_x2": 286.36,
"r_y2": 340.72,
"r_x3": 70.03,
"r_y3": 340.72,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 359.7,
"r_x1": 198.82,
"r_y1": 359.7,
"r_x2": 198.82,
"r_y2": 351.68,
"r_x3": 70.03,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.06,
"r_y0": 359.7,
"r_x1": 213.53,
"r_y1": 359.7,
"r_x2": 213.53,
"r_y2": 351.68,
"r_x3": 206.06,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.02,
"r_y0": 359.49,
"r_x1": 286.36,
"r_y1": 359.49,
"r_x2": 286.36,
"r_y2": 351.76,
"r_x3": 217.02,
"r_y3": 351.76,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 370.45,
"r_x1": 143.08,
"r_y1": 370.45,
"r_x2": 143.08,
"r_y2": 362.72,
"r_x3": 70.03,
"r_y3": 362.72,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.08,
"r_y0": 370.66,
"r_x1": 286.36,
"r_y1": 370.66,
"r_x2": 286.36,
"r_y2": 362.64,
"r_x3": 143.08,
"r_y3": 362.64,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.61,
"r_x1": 161.16,
"r_y1": 381.61,
"r_x2": 161.16,
"r_y2": 373.6,
"r_x3": 70.03,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 392.94,
"r_x1": 65.14,
"r_y1": 392.94,
"r_x2": 65.14,
"r_y2": 384.92,
"r_x3": 50.11,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 67.4,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 286.36,
"r_y1": 403.9,
"r_x2": 286.36,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 414.86,
"r_x1": 125.47,
"r_y1": 414.86,
"r_x2": 125.47,
"r_y2": 406.84,
"r_x3": 70.03,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.91,
"r_y0": 414.86,
"r_x1": 230.83,
"r_y1": 414.86,
"r_x2": 230.83,
"r_y2": 406.84,
"r_x3": 133.91,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.27,
"r_y0": 414.86,
"r_x1": 286.36,
"r_y1": 414.86,
"r_x2": 286.36,
"r_y2": 406.84,
"r_x3": 239.27,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 425.82,
"r_x1": 78.96,
"r_y1": 425.82,
"r_x2": 78.96,
"r_y2": 417.8,
"r_x3": 70.03,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.25,
"r_y0": 425.82,
"r_x1": 286.36,
"r_y1": 425.82,
"r_x2": 286.36,
"r_y2": 417.8,
"r_x3": 81.25,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.77,
"r_x1": 196.76,
"r_y1": 436.77,
"r_x2": 196.76,
"r_y2": 428.76,
"r_x3": 70.03,
"r_y3": 428.76,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.57,
"r_x1": 286.36,
"r_y1": 436.57,
"r_x2": 286.36,
"r_y2": 428.84,
"r_x3": 200.2,
"r_y3": 428.84,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 447.53,
"r_x1": 189.19,
"r_y1": 447.53,
"r_x2": 189.19,
"r_y2": 439.8,
"r_x3": 70.03,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.73,
"r_x1": 286.36,
"r_y1": 447.73,
"r_x2": 286.36,
"r_y2": 439.72,
"r_x3": 189.2,
"r_y3": 439.72,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 458.69,
"r_x1": 158.92,
"r_y1": 458.69,
"r_x2": 158.92,
"r_y2": 450.68,
"r_x3": 70.03,
"r_y3": 450.68,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 470.02,
"r_x1": 65.91,
"r_y1": 470.02,
"r_x2": 65.91,
"r_y2": 462.0,
"r_x3": 50.11,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.28,
"r_y0": 470.02,
"r_x1": 286.36,
"r_y1": 470.02,
"r_x2": 286.36,
"r_y2": 462.0,
"r_x3": 68.28,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 480.97,
"r_x1": 116.28,
"r_y1": 480.97,
"r_x2": 116.28,
"r_y2": 472.96,
"r_x3": 70.03,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.48,
"r_y0": 480.97,
"r_x1": 286.36,
"r_y1": 480.97,
"r_x2": 286.36,
"r_y2": 472.96,
"r_x3": 122.48,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 491.93,
"r_x1": 103.31,
"r_y1": 491.93,
"r_x2": 103.31,
"r_y2": 483.92,
"r_x3": 70.03,
"r_y3": 483.92,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.52,
"r_y0": 491.73,
"r_x1": 286.36,
"r_y1": 491.73,
"r_x2": 286.36,
"r_y2": 484.0,
"r_x3": 105.52,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 502.69,
"r_x1": 212.52,
"r_y1": 502.69,
"r_x2": 212.52,
"r_y2": 494.96,
"r_x3": 70.03,
"r_y3": 494.96,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.51,
"r_y0": 502.89,
"r_x1": 263.56,
"r_y1": 502.89,
"r_x2": 263.56,
"r_y2": 494.88,
"r_x3": 212.51,
"r_y3": 494.88,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.22,
"r_x1": 65.68,
"r_y1": 514.22,
"r_x2": 65.68,
"r_y2": 506.2,
"r_x3": 50.11,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.02,
"r_y0": 514.22,
"r_x1": 247.37,
"r_y1": 514.22,
"r_x2": 247.37,
"r_y2": 506.2,
"r_x3": 68.02,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 253.97,
"r_y0": 514.22,
"r_x1": 286.36,
"r_y1": 514.22,
"r_x2": 286.36,
"r_y2": 506.2,
"r_x3": 253.97,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.18,
"r_x1": 265.62,
"r_y1": 525.18,
"r_x2": 265.62,
"r_y2": 517.16,
"r_x3": 70.03,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.43,
"r_y0": 524.97,
"r_x1": 286.36,
"r_y1": 524.97,
"r_x2": 286.36,
"r_y2": 517.24,
"r_x3": 268.43,
"r_y3": 517.24,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 535.93,
"r_x1": 286.36,
"r_y1": 535.93,
"r_x2": 286.36,
"r_y2": 528.2,
"r_x3": 70.03,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 546.89,
"r_x1": 125.26,
"r_y1": 546.89,
"r_x2": 125.26,
"r_y2": 539.16,
"r_x3": 70.03,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.25,
"r_y0": 547.09,
"r_x1": 240.05,
"r_y1": 547.09,
"r_x2": 240.05,
"r_y2": 539.08,
"r_x3": 125.25,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 558.42,
"r_x1": 66.04,
"r_y1": 558.42,
"r_x2": 66.04,
"r_y2": 550.4,
"r_x3": 50.11,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.43,
"r_y0": 558.42,
"r_x1": 286.36,
"r_y1": 558.42,
"r_x2": 286.36,
"r_y2": 550.4,
"r_x3": 68.43,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.38,
"r_x1": 137.08,
"r_y1": 569.38,
"r_x2": 137.08,
"r_y2": 561.36,
"r_x3": 70.03,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 569.38,
"r_x1": 172.38,
"r_y1": 569.38,
"r_x2": 172.38,
"r_y2": 561.36,
"r_x3": 145.99,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.38,
"r_x1": 286.36,
"r_y1": 569.38,
"r_x2": 286.36,
"r_y2": 561.36,
"r_x3": 178.7,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.33,
"r_x1": 221.01,
"r_y1": 580.33,
"r_x2": 221.01,
"r_y2": 572.32,
"r_x3": 70.03,
"r_y3": 572.32,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.54,
"r_y0": 580.13,
"r_x1": 286.36,
"r_y1": 580.13,
"r_x2": 286.36,
"r_y2": 572.4,
"r_x3": 232.54,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.09,
"r_x1": 135.53,
"r_y1": 591.09,
"r_x2": 135.53,
"r_y2": 583.36,
"r_x3": 70.03,
"r_y3": 583.36,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.53,
"r_y0": 591.29,
"r_x1": 167.9,
"r_y1": 591.29,
"r_x2": 167.9,
"r_y2": 583.28,
"r_x3": 135.53,
"r_y3": 583.28,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.62,
"r_x1": 65.24,
"r_y1": 602.62,
"r_x2": 65.24,
"r_y2": 594.6,
"r_x3": 50.11,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.51,
"r_y0": 602.62,
"r_x1": 286.36,
"r_y1": 602.62,
"r_x2": 286.36,
"r_y2": 594.6,
"r_x3": 67.51,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.58,
"r_x1": 109.11,
"r_y1": 613.58,
"r_x2": 109.11,
"r_y2": 605.56,
"r_x3": 70.03,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.23,
"r_y0": 613.58,
"r_x1": 271.77,
"r_y1": 613.58,
"r_x2": 271.77,
"r_y2": 605.56,
"r_x3": 116.23,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.89,
"r_y0": 613.58,
"r_x1": 286.36,
"r_y1": 613.58,
"r_x2": 286.36,
"r_y2": 605.56,
"r_x3": 278.89,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.33,
"r_x1": 286.36,
"r_y1": 624.33,
"r_x2": 286.36,
"r_y2": 616.6,
"r_x3": 70.03,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.29,
"r_x1": 139.1,
"r_y1": 635.29,
"r_x2": 139.1,
"r_y2": 627.56,
"r_x3": 70.03,
"r_y3": 627.56,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.49,
"r_x1": 238.96,
"r_y1": 635.49,
"r_x2": 238.96,
"r_y2": 627.48,
"r_x3": 139.1,
"r_y3": 627.48,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.82,
"r_x1": 65.2,
"r_y1": 646.82,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.11,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.47,
"r_y0": 646.82,
"r_x1": 286.36,
"r_y1": 646.82,
"r_x2": 286.36,
"r_y2": 638.8,
"r_x3": 67.47,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 657.78,
"r_x1": 286.36,
"r_y1": 657.78,
"r_x2": 286.36,
"r_y2": 649.76,
"r_x3": 70.03,
"r_y3": 649.76,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.74,
"r_x1": 286.36,
"r_y1": 668.74,
"r_x2": 286.36,
"r_y2": 660.72,
"r_x3": 70.03,
"r_y3": 660.72,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.69,
"r_x1": 158.46,
"r_y1": 679.69,
"r_x2": 158.46,
"r_y2": 671.68,
"r_x3": 70.03,
"r_y3": 671.68,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.53,
"r_y0": 679.49,
"r_x1": 286.36,
"r_y1": 679.49,
"r_x2": 286.36,
"r_y2": 671.76,
"r_x3": 160.53,
"r_y3": 671.76,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 690.45,
"r_x1": 171.42,
"r_y1": 690.45,
"r_x2": 171.42,
"r_y2": 682.72,
"r_x3": 70.03,
"r_y3": 682.72,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.42,
"r_y0": 690.65,
"r_x1": 212.76,
"r_y1": 690.65,
"r_x2": 212.76,
"r_y2": 682.64,
"r_x3": 171.42,
"r_y3": 682.64,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.98,
"r_x1": 66.51,
"r_y1": 701.98,
"r_x2": 66.51,
"r_y2": 693.96,
"r_x3": 50.11,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.97,
"r_y0": 701.98,
"r_x1": 80.99,
"r_y1": 701.98,
"r_x2": 80.99,
"r_y2": 693.96,
"r_x3": 68.97,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.06,
"r_y0": 701.98,
"r_x1": 114.71,
"r_y1": 701.98,
"r_x2": 114.71,
"r_y2": 693.96,
"r_x3": 89.06,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.25,
"r_y0": 701.98,
"r_x1": 149.15,
"r_y1": 701.98,
"r_x2": 149.15,
"r_y2": 693.96,
"r_x3": 124.25,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.22,
"r_y0": 701.98,
"r_x1": 209.37,
"r_y1": 701.98,
"r_x2": 209.37,
"r_y2": 693.96,
"r_x3": 157.22,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 701.98,
"r_x1": 231.85,
"r_y1": 701.98,
"r_x2": 231.85,
"r_y2": 693.96,
"r_x3": 218.9,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.93,
"r_y0": 701.98,
"r_x1": 269.32,
"r_y1": 701.98,
"r_x2": 269.32,
"r_y2": 693.96,
"r_x3": 239.93,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.39,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 277.39,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 286.36,
"r_y1": 712.94,
"r_x2": 286.36,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 328.78,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 472.31,
"r_y1": 94.86,
"r_x2": 472.31,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.89,
"r_y0": 94.65,
"r_x1": 545.11,
"r_y1": 94.65,
"r_x2": 545.11,
"r_y2": 86.92,
"r_x3": 475.89,
"r_y3": 86.92,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.61,
"r_x1": 371.93,
"r_y1": 105.61,
"r_x2": 371.93,
"r_y2": 97.88,
"r_x3": 328.78,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.93,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 371.93,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 417.7,
"r_y1": 116.78,
"r_x2": 417.7,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 128.73,
"r_x1": 324.33,
"r_y1": 128.73,
"r_x2": 324.33,
"r_y2": 120.71,
"r_x3": 308.86,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.65,
"r_y0": 128.73,
"r_x1": 545.11,
"r_y1": 128.73,
"r_x2": 545.11,
"r_y2": 120.71,
"r_x3": 326.65,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 139.69,
"r_x1": 545.11,
"r_y1": 139.69,
"r_x2": 545.11,
"r_y2": 131.67,
"r_x3": 328.78,
"r_y3": 131.67,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 150.44,
"r_x1": 545.11,
"r_y1": 150.44,
"r_x2": 545.11,
"r_y2": 142.71,
"r_x3": 328.78,
"r_y3": 142.71,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.4,
"r_x1": 406.32,
"r_y1": 161.4,
"r_x2": 406.32,
"r_y2": 153.67,
"r_x3": 328.78,
"r_y3": 153.67,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 161.61,
"r_x1": 506.18,
"r_y1": 161.61,
"r_x2": 506.18,
"r_y2": 153.59,
"r_x3": 406.32,
"r_y3": 153.59,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 15,
"label": "text",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 94.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.689,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.69,
"r_x1": 223.58,
"r_y1": 83.69,
"r_x2": 223.58,
"r_y2": 75.96,
"r_x3": 70.03,
"r_y3": 75.96,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.58,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 223.58,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 97.92,
"r_y1": 94.86,
"r_x2": 97.92,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 98.17,
"r": 286.37,
"b": 160.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 106.18,
"r_x1": 65.53,
"r_y1": 106.18,
"r_x2": 65.53,
"r_y2": 98.17,
"r_x3": 50.11,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 106.18,
"r_x1": 286.36,
"r_y1": 106.18,
"r_x2": 286.36,
"r_y2": 98.17,
"r_x3": 67.85,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 117.14,
"r_x1": 286.36,
"r_y1": 117.14,
"r_x2": 286.36,
"r_y2": 109.12,
"r_x3": 70.03,
"r_y3": 109.12,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 128.1,
"r_x1": 286.36,
"r_y1": 128.1,
"r_x2": 286.36,
"r_y2": 120.08,
"r_x3": 70.03,
"r_y3": 120.08,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.06,
"r_x1": 77.5,
"r_y1": 139.06,
"r_x2": 77.5,
"r_y2": 131.04,
"r_x3": 70.03,
"r_y3": 131.04,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.56,
"r_y0": 138.85,
"r_x1": 286.37,
"r_y1": 138.85,
"r_x2": 286.37,
"r_y2": 131.12,
"r_x3": 80.56,
"r_y3": 131.12,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.81,
"r_x1": 195.23,
"r_y1": 149.81,
"r_x2": 195.23,
"r_y2": 142.08,
"r_x3": 70.03,
"r_y3": 142.08,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.23,
"r_y0": 150.02,
"r_x1": 286.37,
"r_y1": 150.02,
"r_x2": 286.37,
"r_y2": 142.0,
"r_x3": 195.23,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 160.98,
"r_x1": 120.33,
"r_y1": 160.98,
"r_x2": 120.33,
"r_y2": 152.96,
"r_x3": 70.03,
"r_y3": 152.96,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 164.28,
"r": 286.36,
"b": 227.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 172.3,
"r_x1": 65.53,
"r_y1": 172.3,
"r_x2": 65.53,
"r_y2": 164.28,
"r_x3": 50.11,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 172.3,
"r_x1": 286.36,
"r_y1": 172.3,
"r_x2": 286.36,
"r_y2": 164.28,
"r_x3": 67.85,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.26,
"r_x1": 286.36,
"r_y1": 183.26,
"r_x2": 286.36,
"r_y2": 175.24,
"r_x3": 70.03,
"r_y3": 175.24,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 194.22,
"r_x1": 286.36,
"r_y1": 194.22,
"r_x2": 286.36,
"r_y2": 186.2,
"r_x3": 70.03,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.18,
"r_x1": 101.33,
"r_y1": 205.18,
"r_x2": 101.33,
"r_y2": 197.16,
"r_x3": 70.03,
"r_y3": 197.16,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.33,
"r_y0": 204.97,
"r_x1": 286.36,
"r_y1": 204.97,
"r_x2": 286.36,
"r_y2": 197.24,
"r_x3": 104.33,
"r_y3": 197.24,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 215.93,
"r_x1": 220.49,
"r_y1": 215.93,
"r_x2": 220.49,
"r_y2": 208.2,
"r_x3": 70.03,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.48,
"r_y0": 216.14,
"r_x1": 286.36,
"r_y1": 216.14,
"r_x2": 286.36,
"r_y2": 208.12,
"r_x3": 220.48,
"r_y3": 208.12,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.09,
"r_x1": 166.65,
"r_y1": 227.09,
"r_x2": 166.65,
"r_y2": 219.08,
"r_x3": 70.03,
"r_y3": 219.08,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 230.4,
"r": 286.37,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.851,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 238.42,
"r_x1": 65.65,
"r_y1": 238.42,
"r_x2": 65.65,
"r_y2": 230.4,
"r_x3": 50.11,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 238.42,
"r_x1": 286.36,
"r_y1": 238.42,
"r_x2": 286.36,
"r_y2": 230.4,
"r_x3": 67.98,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.38,
"r_x1": 147.17,
"r_y1": 249.38,
"r_x2": 147.17,
"r_y2": 241.36,
"r_x3": 70.03,
"r_y3": 241.36,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.93,
"r_y0": 249.17,
"r_x1": 286.37,
"r_y1": 249.17,
"r_x2": 286.37,
"r_y2": 241.44,
"r_x3": 149.93,
"r_y3": 241.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.13,
"r_x1": 244.69,
"r_y1": 260.13,
"r_x2": 244.69,
"r_y2": 252.4,
"r_x3": 70.03,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.69,
"r_y0": 260.34,
"r_x1": 286.36,
"r_y1": 260.34,
"r_x2": 286.36,
"r_y2": 252.32,
"r_x3": 244.69,
"r_y3": 252.32,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.3,
"r_x1": 111.37,
"r_y1": 271.3,
"r_x2": 111.37,
"r_y2": 263.28,
"r_x3": 70.03,
"r_y3": 263.28,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 274.6,
"r": 286.37,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 282.62,
"r_x1": 66.02,
"r_y1": 282.62,
"r_x2": 66.02,
"r_y2": 274.6,
"r_x3": 50.11,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.41,
"r_y0": 282.62,
"r_x1": 94.94,
"r_y1": 282.62,
"r_x2": 94.94,
"r_y2": 274.6,
"r_x3": 68.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.87,
"r_y0": 282.62,
"r_x1": 127.27,
"r_y1": 282.62,
"r_x2": 127.27,
"r_y2": 274.6,
"r_x3": 100.87,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.19,
"r_y0": 282.62,
"r_x1": 165.83,
"r_y1": 282.62,
"r_x2": 165.83,
"r_y2": 274.6,
"r_x3": 133.19,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.68,
"r_y0": 282.62,
"r_x1": 194.09,
"r_y1": 282.62,
"r_x2": 194.09,
"r_y2": 274.6,
"r_x3": 172.68,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.02,
"r_y0": 282.62,
"r_x1": 211.48,
"r_y1": 282.62,
"r_x2": 211.48,
"r_y2": 274.6,
"r_x3": 200.02,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.41,
"r_y0": 282.62,
"r_x1": 239.44,
"r_y1": 282.62,
"r_x2": 239.44,
"r_y2": 274.6,
"r_x3": 217.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 282.62,
"r_x1": 264.22,
"r_y1": 282.62,
"r_x2": 264.22,
"r_y2": 274.6,
"r_x3": 246.29,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.15,
"r_y0": 282.62,
"r_x1": 286.36,
"r_y1": 282.62,
"r_x2": 286.36,
"r_y2": 274.6,
"r_x3": 270.15,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.58,
"r_x1": 286.36,
"r_y1": 293.58,
"r_x2": 286.36,
"r_y2": 285.56,
"r_x3": 70.03,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.54,
"r_x1": 286.36,
"r_y1": 304.54,
"r_x2": 286.36,
"r_y2": 296.52,
"r_x3": 70.03,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.48,
"r_x3": 70.03,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.35,
"r_y0": 315.29,
"r_x1": 286.37,
"r_y1": 315.29,
"r_x2": 286.37,
"r_y2": 307.56,
"r_x3": 79.35,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 326.25,
"r_x1": 147.57,
"r_y1": 326.25,
"r_x2": 147.57,
"r_y2": 318.52,
"r_x3": 70.03,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.57,
"r_y0": 326.45,
"r_x1": 271.34,
"r_y1": 326.45,
"r_x2": 271.34,
"r_y2": 318.44,
"r_x3": 147.57,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 329.76,
"r": 286.36,
"b": 381.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 337.78,
"r_x1": 65.37,
"r_y1": 337.78,
"r_x2": 65.37,
"r_y2": 329.76,
"r_x3": 50.11,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.66,
"r_y0": 337.78,
"r_x1": 286.36,
"r_y1": 337.78,
"r_x2": 286.36,
"r_y2": 329.76,
"r_x3": 67.66,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.74,
"r_x1": 286.36,
"r_y1": 348.74,
"r_x2": 286.36,
"r_y2": 340.72,
"r_x3": 70.03,
"r_y3": 340.72,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 359.7,
"r_x1": 198.82,
"r_y1": 359.7,
"r_x2": 198.82,
"r_y2": 351.68,
"r_x3": 70.03,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.06,
"r_y0": 359.7,
"r_x1": 213.53,
"r_y1": 359.7,
"r_x2": 213.53,
"r_y2": 351.68,
"r_x3": 206.06,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.02,
"r_y0": 359.49,
"r_x1": 286.36,
"r_y1": 359.49,
"r_x2": 286.36,
"r_y2": 351.76,
"r_x3": 217.02,
"r_y3": 351.76,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 370.45,
"r_x1": 143.08,
"r_y1": 370.45,
"r_x2": 143.08,
"r_y2": 362.72,
"r_x3": 70.03,
"r_y3": 362.72,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.08,
"r_y0": 370.66,
"r_x1": 286.36,
"r_y1": 370.66,
"r_x2": 286.36,
"r_y2": 362.64,
"r_x3": 143.08,
"r_y3": 362.64,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.61,
"r_x1": 161.16,
"r_y1": 381.61,
"r_x2": 161.16,
"r_y2": 373.6,
"r_x3": 70.03,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 384.92,
"r": 286.36,
"b": 458.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 392.94,
"r_x1": 65.14,
"r_y1": 392.94,
"r_x2": 65.14,
"r_y2": 384.92,
"r_x3": 50.11,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 67.4,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 286.36,
"r_y1": 403.9,
"r_x2": 286.36,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 414.86,
"r_x1": 125.47,
"r_y1": 414.86,
"r_x2": 125.47,
"r_y2": 406.84,
"r_x3": 70.03,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.91,
"r_y0": 414.86,
"r_x1": 230.83,
"r_y1": 414.86,
"r_x2": 230.83,
"r_y2": 406.84,
"r_x3": 133.91,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.27,
"r_y0": 414.86,
"r_x1": 286.36,
"r_y1": 414.86,
"r_x2": 286.36,
"r_y2": 406.84,
"r_x3": 239.27,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 425.82,
"r_x1": 78.96,
"r_y1": 425.82,
"r_x2": 78.96,
"r_y2": 417.8,
"r_x3": 70.03,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.25,
"r_y0": 425.82,
"r_x1": 286.36,
"r_y1": 425.82,
"r_x2": 286.36,
"r_y2": 417.8,
"r_x3": 81.25,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.77,
"r_x1": 196.76,
"r_y1": 436.77,
"r_x2": 196.76,
"r_y2": 428.76,
"r_x3": 70.03,
"r_y3": 428.76,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.57,
"r_x1": 286.36,
"r_y1": 436.57,
"r_x2": 286.36,
"r_y2": 428.84,
"r_x3": 200.2,
"r_y3": 428.84,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 447.53,
"r_x1": 189.19,
"r_y1": 447.53,
"r_x2": 189.19,
"r_y2": 439.8,
"r_x3": 70.03,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.73,
"r_x1": 286.36,
"r_y1": 447.73,
"r_x2": 286.36,
"r_y2": 439.72,
"r_x3": 189.2,
"r_y3": 439.72,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 458.69,
"r_x1": 158.92,
"r_y1": 458.69,
"r_x2": 158.92,
"r_y2": 450.68,
"r_x3": 70.03,
"r_y3": 450.68,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 462.0,
"r": 286.36,
"b": 502.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.843,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 470.02,
"r_x1": 65.91,
"r_y1": 470.02,
"r_x2": 65.91,
"r_y2": 462.0,
"r_x3": 50.11,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.28,
"r_y0": 470.02,
"r_x1": 286.36,
"r_y1": 470.02,
"r_x2": 286.36,
"r_y2": 462.0,
"r_x3": 68.28,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 480.97,
"r_x1": 116.28,
"r_y1": 480.97,
"r_x2": 116.28,
"r_y2": 472.96,
"r_x3": 70.03,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.48,
"r_y0": 480.97,
"r_x1": 286.36,
"r_y1": 480.97,
"r_x2": 286.36,
"r_y2": 472.96,
"r_x3": 122.48,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 491.93,
"r_x1": 103.31,
"r_y1": 491.93,
"r_x2": 103.31,
"r_y2": 483.92,
"r_x3": 70.03,
"r_y3": 483.92,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.52,
"r_y0": 491.73,
"r_x1": 286.36,
"r_y1": 491.73,
"r_x2": 286.36,
"r_y2": 484.0,
"r_x3": 105.52,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 502.69,
"r_x1": 212.52,
"r_y1": 502.69,
"r_x2": 212.52,
"r_y2": 494.96,
"r_x3": 70.03,
"r_y3": 494.96,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.51,
"r_y0": 502.89,
"r_x1": 263.56,
"r_y1": 502.89,
"r_x2": 263.56,
"r_y2": 494.88,
"r_x3": 212.51,
"r_y3": 494.88,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 506.2,
"r": 286.36,
"b": 547.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.22,
"r_x1": 65.68,
"r_y1": 514.22,
"r_x2": 65.68,
"r_y2": 506.2,
"r_x3": 50.11,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.02,
"r_y0": 514.22,
"r_x1": 247.37,
"r_y1": 514.22,
"r_x2": 247.37,
"r_y2": 506.2,
"r_x3": 68.02,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 253.97,
"r_y0": 514.22,
"r_x1": 286.36,
"r_y1": 514.22,
"r_x2": 286.36,
"r_y2": 506.2,
"r_x3": 253.97,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.18,
"r_x1": 265.62,
"r_y1": 525.18,
"r_x2": 265.62,
"r_y2": 517.16,
"r_x3": 70.03,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.43,
"r_y0": 524.97,
"r_x1": 286.36,
"r_y1": 524.97,
"r_x2": 286.36,
"r_y2": 517.24,
"r_x3": 268.43,
"r_y3": 517.24,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 535.93,
"r_x1": 286.36,
"r_y1": 535.93,
"r_x2": 286.36,
"r_y2": 528.2,
"r_x3": 70.03,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 546.89,
"r_x1": 125.26,
"r_y1": 546.89,
"r_x2": 125.26,
"r_y2": 539.16,
"r_x3": 70.03,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.25,
"r_y0": 547.09,
"r_x1": 240.05,
"r_y1": 547.09,
"r_x2": 240.05,
"r_y2": 539.08,
"r_x3": 125.25,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 550.4,
"r": 286.36,
"b": 591.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.824,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 558.42,
"r_x1": 66.04,
"r_y1": 558.42,
"r_x2": 66.04,
"r_y2": 550.4,
"r_x3": 50.11,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.43,
"r_y0": 558.42,
"r_x1": 286.36,
"r_y1": 558.42,
"r_x2": 286.36,
"r_y2": 550.4,
"r_x3": 68.43,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.38,
"r_x1": 137.08,
"r_y1": 569.38,
"r_x2": 137.08,
"r_y2": 561.36,
"r_x3": 70.03,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 569.38,
"r_x1": 172.38,
"r_y1": 569.38,
"r_x2": 172.38,
"r_y2": 561.36,
"r_x3": 145.99,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.38,
"r_x1": 286.36,
"r_y1": 569.38,
"r_x2": 286.36,
"r_y2": 561.36,
"r_x3": 178.7,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.33,
"r_x1": 221.01,
"r_y1": 580.33,
"r_x2": 221.01,
"r_y2": 572.32,
"r_x3": 70.03,
"r_y3": 572.32,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.54,
"r_y0": 580.13,
"r_x1": 286.36,
"r_y1": 580.13,
"r_x2": 286.36,
"r_y2": 572.4,
"r_x3": 232.54,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.09,
"r_x1": 135.53,
"r_y1": 591.09,
"r_x2": 135.53,
"r_y2": 583.36,
"r_x3": 70.03,
"r_y3": 583.36,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.53,
"r_y0": 591.29,
"r_x1": 167.9,
"r_y1": 591.29,
"r_x2": 167.9,
"r_y2": 583.28,
"r_x3": 135.53,
"r_y3": 583.28,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.6,
"r": 286.36,
"b": 635.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.836,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.62,
"r_x1": 65.24,
"r_y1": 602.62,
"r_x2": 65.24,
"r_y2": 594.6,
"r_x3": 50.11,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.51,
"r_y0": 602.62,
"r_x1": 286.36,
"r_y1": 602.62,
"r_x2": 286.36,
"r_y2": 594.6,
"r_x3": 67.51,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.58,
"r_x1": 109.11,
"r_y1": 613.58,
"r_x2": 109.11,
"r_y2": 605.56,
"r_x3": 70.03,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.23,
"r_y0": 613.58,
"r_x1": 271.77,
"r_y1": 613.58,
"r_x2": 271.77,
"r_y2": 605.56,
"r_x3": 116.23,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.89,
"r_y0": 613.58,
"r_x1": 286.36,
"r_y1": 613.58,
"r_x2": 286.36,
"r_y2": 605.56,
"r_x3": 278.89,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.33,
"r_x1": 286.36,
"r_y1": 624.33,
"r_x2": 286.36,
"r_y2": 616.6,
"r_x3": 70.03,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.29,
"r_x1": 139.1,
"r_y1": 635.29,
"r_x2": 139.1,
"r_y2": 627.56,
"r_x3": 70.03,
"r_y3": 627.56,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.49,
"r_x1": 238.96,
"r_y1": 635.49,
"r_x2": 238.96,
"r_y2": 627.48,
"r_x3": 139.1,
"r_y3": 627.48,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 638.8,
"r": 286.36,
"b": 690.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.808,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.82,
"r_x1": 65.2,
"r_y1": 646.82,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.11,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.47,
"r_y0": 646.82,
"r_x1": 286.36,
"r_y1": 646.82,
"r_x2": 286.36,
"r_y2": 638.8,
"r_x3": 67.47,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 657.78,
"r_x1": 286.36,
"r_y1": 657.78,
"r_x2": 286.36,
"r_y2": 649.76,
"r_x3": 70.03,
"r_y3": 649.76,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.74,
"r_x1": 286.36,
"r_y1": 668.74,
"r_x2": 286.36,
"r_y2": 660.72,
"r_x3": 70.03,
"r_y3": 660.72,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.69,
"r_x1": 158.46,
"r_y1": 679.69,
"r_x2": 158.46,
"r_y2": 671.68,
"r_x3": 70.03,
"r_y3": 671.68,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.53,
"r_y0": 679.49,
"r_x1": 286.36,
"r_y1": 679.49,
"r_x2": 286.36,
"r_y2": 671.76,
"r_x3": 160.53,
"r_y3": 671.76,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 690.45,
"r_x1": 171.42,
"r_y1": 690.45,
"r_x2": 171.42,
"r_y2": 682.72,
"r_x3": 70.03,
"r_y3": 682.72,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.42,
"r_y0": 690.65,
"r_x1": 212.76,
"r_y1": 690.65,
"r_x2": 212.76,
"r_y2": 682.64,
"r_x3": 171.42,
"r_y3": 682.64,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 693.96,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.839,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.98,
"r_x1": 66.51,
"r_y1": 701.98,
"r_x2": 66.51,
"r_y2": 693.96,
"r_x3": 50.11,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.97,
"r_y0": 701.98,
"r_x1": 80.99,
"r_y1": 701.98,
"r_x2": 80.99,
"r_y2": 693.96,
"r_x3": 68.97,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.06,
"r_y0": 701.98,
"r_x1": 114.71,
"r_y1": 701.98,
"r_x2": 114.71,
"r_y2": 693.96,
"r_x3": 89.06,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.25,
"r_y0": 701.98,
"r_x1": 149.15,
"r_y1": 701.98,
"r_x2": 149.15,
"r_y2": 693.96,
"r_x3": 124.25,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.22,
"r_y0": 701.98,
"r_x1": 209.37,
"r_y1": 701.98,
"r_x2": 209.37,
"r_y2": 693.96,
"r_x3": 157.22,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 701.98,
"r_x1": 231.85,
"r_y1": 701.98,
"r_x2": 231.85,
"r_y2": 693.96,
"r_x3": 218.9,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.93,
"r_y0": 701.98,
"r_x1": 269.32,
"r_y1": 701.98,
"r_x2": 269.32,
"r_y2": 693.96,
"r_x3": 239.93,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.39,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 277.39,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 286.36,
"r_y1": 712.94,
"r_x2": 286.36,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.78,
"t": 75.88,
"r": 545.11,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.756,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 328.78,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 472.31,
"r_y1": 94.86,
"r_x2": 472.31,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.89,
"r_y0": 94.65,
"r_x1": 545.11,
"r_y1": 94.65,
"r_x2": 545.11,
"r_y2": 86.92,
"r_x3": 475.89,
"r_y3": 86.92,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.61,
"r_x1": 371.93,
"r_y1": 105.61,
"r_x2": 371.93,
"r_y2": 97.88,
"r_x3": 328.78,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.93,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 371.93,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 417.7,
"r_y1": 116.78,
"r_x2": 417.7,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 120.71,
"r": 545.11,
"b": 161.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 128.73,
"r_x1": 324.33,
"r_y1": 128.73,
"r_x2": 324.33,
"r_y2": 120.71,
"r_x3": 308.86,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.65,
"r_y0": 128.73,
"r_x1": 545.11,
"r_y1": 128.73,
"r_x2": 545.11,
"r_y2": 120.71,
"r_x3": 326.65,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 139.69,
"r_x1": 545.11,
"r_y1": 139.69,
"r_x2": 545.11,
"r_y2": 131.67,
"r_x3": 328.78,
"r_y3": 131.67,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 150.44,
"r_x1": 545.11,
"r_y1": 150.44,
"r_x2": 545.11,
"r_y2": 142.71,
"r_x3": 328.78,
"r_y3": 142.71,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.4,
"r_x1": 406.32,
"r_y1": 161.4,
"r_x2": 406.32,
"r_y2": 153.67,
"r_x3": 328.78,
"r_y3": 153.67,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 161.61,
"r_x1": 506.18,
"r_y1": 161.61,
"r_x2": 506.18,
"r_y2": 153.59,
"r_x3": 406.32,
"r_y3": 153.59,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.907,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 15,
"page_no": 9,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 94.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.689,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.69,
"r_x1": 223.58,
"r_y1": 83.69,
"r_x2": 223.58,
"r_y2": 75.96,
"r_x3": 70.03,
"r_y3": 75.96,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.58,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 223.58,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 97.92,
"r_y1": 94.86,
"r_x2": 97.92,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"
},
{
"label": "list_item",
"id": 13,
"page_no": 9,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 98.17,
"r": 286.37,
"b": 160.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 106.18,
"r_x1": 65.53,
"r_y1": 106.18,
"r_x2": 65.53,
"r_y2": 98.17,
"r_x3": 50.11,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 106.18,
"r_x1": 286.36,
"r_y1": 106.18,
"r_x2": 286.36,
"r_y2": 98.17,
"r_x3": 67.85,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 117.14,
"r_x1": 286.36,
"r_y1": 117.14,
"r_x2": 286.36,
"r_y2": 109.12,
"r_x3": 70.03,
"r_y3": 109.12,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 128.1,
"r_x1": 286.36,
"r_y1": 128.1,
"r_x2": 286.36,
"r_y2": 120.08,
"r_x3": 70.03,
"r_y3": 120.08,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.06,
"r_x1": 77.5,
"r_y1": 139.06,
"r_x2": 77.5,
"r_y2": 131.04,
"r_x3": 70.03,
"r_y3": 131.04,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.56,
"r_y0": 138.85,
"r_x1": 286.37,
"r_y1": 138.85,
"r_x2": 286.37,
"r_y2": 131.12,
"r_x3": 80.56,
"r_y3": 131.12,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.81,
"r_x1": 195.23,
"r_y1": 149.81,
"r_x2": 195.23,
"r_y2": 142.08,
"r_x3": 70.03,
"r_y3": 142.08,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.23,
"r_y0": 150.02,
"r_x1": 286.37,
"r_y1": 150.02,
"r_x2": 286.37,
"r_y2": 142.0,
"r_x3": 195.23,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 160.98,
"r_x1": 120.33,
"r_y1": 160.98,
"r_x2": 120.33,
"r_y2": 152.96,
"r_x3": 70.03,
"r_y3": 152.96,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1"
},
{
"label": "list_item",
"id": 2,
"page_no": 9,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 164.28,
"r": 286.36,
"b": 227.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 172.3,
"r_x1": 65.53,
"r_y1": 172.3,
"r_x2": 65.53,
"r_y2": 164.28,
"r_x3": 50.11,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 172.3,
"r_x1": 286.36,
"r_y1": 172.3,
"r_x2": 286.36,
"r_y2": 164.28,
"r_x3": 67.85,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.26,
"r_x1": 286.36,
"r_y1": 183.26,
"r_x2": 286.36,
"r_y2": 175.24,
"r_x3": 70.03,
"r_y3": 175.24,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 194.22,
"r_x1": 286.36,
"r_y1": 194.22,
"r_x2": 286.36,
"r_y2": 186.2,
"r_x3": 70.03,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.18,
"r_x1": 101.33,
"r_y1": 205.18,
"r_x2": 101.33,
"r_y2": 197.16,
"r_x3": 70.03,
"r_y3": 197.16,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.33,
"r_y0": 204.97,
"r_x1": 286.36,
"r_y1": 204.97,
"r_x2": 286.36,
"r_y2": 197.24,
"r_x3": 104.33,
"r_y3": 197.24,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 215.93,
"r_x1": 220.49,
"r_y1": 215.93,
"r_x2": 220.49,
"r_y2": 208.2,
"r_x3": 70.03,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.48,
"r_y0": 216.14,
"r_x1": 286.36,
"r_y1": 216.14,
"r_x2": 286.36,
"r_y2": 208.12,
"r_x3": 220.48,
"r_y3": 208.12,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.09,
"r_x1": 166.65,
"r_y1": 227.09,
"r_x2": 166.65,
"r_y2": 219.08,
"r_x3": 70.03,
"r_y3": 219.08,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"
},
{
"label": "list_item",
"id": 4,
"page_no": 9,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 230.4,
"r": 286.37,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.851,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 238.42,
"r_x1": 65.65,
"r_y1": 238.42,
"r_x2": 65.65,
"r_y2": 230.4,
"r_x3": 50.11,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 238.42,
"r_x1": 286.36,
"r_y1": 238.42,
"r_x2": 286.36,
"r_y2": 230.4,
"r_x3": 67.98,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.38,
"r_x1": 147.17,
"r_y1": 249.38,
"r_x2": 147.17,
"r_y2": 241.36,
"r_x3": 70.03,
"r_y3": 241.36,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.93,
"r_y0": 249.17,
"r_x1": 286.37,
"r_y1": 249.17,
"r_x2": 286.37,
"r_y2": 241.44,
"r_x3": 149.93,
"r_y3": 241.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.13,
"r_x1": 244.69,
"r_y1": 260.13,
"r_x2": 244.69,
"r_y2": 252.4,
"r_x3": 70.03,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.69,
"r_y0": 260.34,
"r_x1": 286.36,
"r_y1": 260.34,
"r_x2": 286.36,
"r_y2": 252.32,
"r_x3": 244.69,
"r_y3": 252.32,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.3,
"r_x1": 111.37,
"r_y1": 271.3,
"r_x2": 111.37,
"r_y2": 263.28,
"r_x3": 70.03,
"r_y3": 263.28,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 65-72, 2010. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 9,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 274.6,
"r": 286.37,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 282.62,
"r_x1": 66.02,
"r_y1": 282.62,
"r_x2": 66.02,
"r_y2": 274.6,
"r_x3": 50.11,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.41,
"r_y0": 282.62,
"r_x1": 94.94,
"r_y1": 282.62,
"r_x2": 94.94,
"r_y2": 274.6,
"r_x3": 68.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.87,
"r_y0": 282.62,
"r_x1": 127.27,
"r_y1": 282.62,
"r_x2": 127.27,
"r_y2": 274.6,
"r_x3": 100.87,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.19,
"r_y0": 282.62,
"r_x1": 165.83,
"r_y1": 282.62,
"r_x2": 165.83,
"r_y2": 274.6,
"r_x3": 133.19,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.68,
"r_y0": 282.62,
"r_x1": 194.09,
"r_y1": 282.62,
"r_x2": 194.09,
"r_y2": 274.6,
"r_x3": 172.68,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.02,
"r_y0": 282.62,
"r_x1": 211.48,
"r_y1": 282.62,
"r_x2": 211.48,
"r_y2": 274.6,
"r_x3": 200.02,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.41,
"r_y0": 282.62,
"r_x1": 239.44,
"r_y1": 282.62,
"r_x2": 239.44,
"r_y2": 274.6,
"r_x3": 217.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 282.62,
"r_x1": 264.22,
"r_y1": 282.62,
"r_x2": 264.22,
"r_y2": 274.6,
"r_x3": 246.29,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.15,
"r_y0": 282.62,
"r_x1": 286.36,
"r_y1": 282.62,
"r_x2": 286.36,
"r_y2": 274.6,
"r_x3": 270.15,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.58,
"r_x1": 286.36,
"r_y1": 293.58,
"r_x2": 286.36,
"r_y2": 285.56,
"r_x3": 70.03,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.54,
"r_x1": 286.36,
"r_y1": 304.54,
"r_x2": 286.36,
"r_y2": 296.52,
"r_x3": 70.03,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.48,
"r_x3": 70.03,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.35,
"r_y0": 315.29,
"r_x1": 286.37,
"r_y1": 315.29,
"r_x2": 286.37,
"r_y2": 307.56,
"r_x3": 79.35,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 326.25,
"r_x1": 147.57,
"r_y1": 326.25,
"r_x2": 147.57,
"r_y2": 318.52,
"r_x3": 70.03,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.57,
"r_y0": 326.45,
"r_x1": 271.34,
"r_y1": 326.45,
"r_x2": 271.34,
"r_y2": 318.44,
"r_x3": 147.57,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 3,
"page_no": 9,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 329.76,
"r": 286.36,
"b": 381.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 337.78,
"r_x1": 65.37,
"r_y1": 337.78,
"r_x2": 65.37,
"r_y2": 329.76,
"r_x3": 50.11,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.66,
"r_y0": 337.78,
"r_x1": 286.36,
"r_y1": 337.78,
"r_x2": 286.36,
"r_y2": 329.76,
"r_x3": 67.66,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.74,
"r_x1": 286.36,
"r_y1": 348.74,
"r_x2": 286.36,
"r_y2": 340.72,
"r_x3": 70.03,
"r_y3": 340.72,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 359.7,
"r_x1": 198.82,
"r_y1": 359.7,
"r_x2": 198.82,
"r_y2": 351.68,
"r_x3": 70.03,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.06,
"r_y0": 359.7,
"r_x1": 213.53,
"r_y1": 359.7,
"r_x2": 213.53,
"r_y2": 351.68,
"r_x3": 206.06,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.02,
"r_y0": 359.49,
"r_x1": 286.36,
"r_y1": 359.49,
"r_x2": 286.36,
"r_y2": 351.76,
"r_x3": 217.02,
"r_y3": 351.76,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 370.45,
"r_x1": 143.08,
"r_y1": 370.45,
"r_x2": 143.08,
"r_y2": 362.72,
"r_x3": 70.03,
"r_y3": 362.72,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.08,
"r_y0": 370.66,
"r_x1": 286.36,
"r_y1": 370.66,
"r_x2": 286.36,
"r_y2": 362.64,
"r_x3": 143.08,
"r_y3": 362.64,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.61,
"r_x1": 161.16,
"r_y1": 381.61,
"r_x2": 161.16,
"r_y2": 373.6,
"r_x3": 70.03,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"
},
{
"label": "list_item",
"id": 1,
"page_no": 9,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 384.92,
"r": 286.36,
"b": 458.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 392.94,
"r_x1": 65.14,
"r_y1": 392.94,
"r_x2": 65.14,
"r_y2": 384.92,
"r_x3": 50.11,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 67.4,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 286.36,
"r_y1": 403.9,
"r_x2": 286.36,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 414.86,
"r_x1": 125.47,
"r_y1": 414.86,
"r_x2": 125.47,
"r_y2": 406.84,
"r_x3": 70.03,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.91,
"r_y0": 414.86,
"r_x1": 230.83,
"r_y1": 414.86,
"r_x2": 230.83,
"r_y2": 406.84,
"r_x3": 133.91,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.27,
"r_y0": 414.86,
"r_x1": 286.36,
"r_y1": 414.86,
"r_x2": 286.36,
"r_y2": 406.84,
"r_x3": 239.27,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 425.82,
"r_x1": 78.96,
"r_y1": 425.82,
"r_x2": 78.96,
"r_y2": 417.8,
"r_x3": 70.03,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.25,
"r_y0": 425.82,
"r_x1": 286.36,
"r_y1": 425.82,
"r_x2": 286.36,
"r_y2": 417.8,
"r_x3": 81.25,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.77,
"r_x1": 196.76,
"r_y1": 436.77,
"r_x2": 196.76,
"r_y2": 428.76,
"r_x3": 70.03,
"r_y3": 428.76,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.57,
"r_x1": 286.36,
"r_y1": 436.57,
"r_x2": 286.36,
"r_y2": 428.84,
"r_x3": 200.2,
"r_y3": 428.84,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 447.53,
"r_x1": 189.19,
"r_y1": 447.53,
"r_x2": 189.19,
"r_y2": 439.8,
"r_x3": 70.03,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.73,
"r_x1": 286.36,
"r_y1": 447.73,
"r_x2": 286.36,
"r_y2": 439.72,
"r_x3": 189.2,
"r_y3": 439.72,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 458.69,
"r_x1": 158.92,
"r_y1": 458.69,
"r_x2": 158.92,
"r_y2": 450.68,
"r_x3": 70.03,
"r_y3": 450.68,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"
},
{
"label": "list_item",
"id": 6,
"page_no": 9,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 462.0,
"r": 286.36,
"b": 502.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.843,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 470.02,
"r_x1": 65.91,
"r_y1": 470.02,
"r_x2": 65.91,
"r_y2": 462.0,
"r_x3": 50.11,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.28,
"r_y0": 470.02,
"r_x1": 286.36,
"r_y1": 470.02,
"r_x2": 286.36,
"r_y2": 462.0,
"r_x3": 68.28,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 480.97,
"r_x1": 116.28,
"r_y1": 480.97,
"r_x2": 116.28,
"r_y2": 472.96,
"r_x3": 70.03,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.48,
"r_y0": 480.97,
"r_x1": 286.36,
"r_y1": 480.97,
"r_x2": 286.36,
"r_y2": 472.96,
"r_x3": 122.48,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 491.93,
"r_x1": 103.31,
"r_y1": 491.93,
"r_x2": 103.31,
"r_y2": 483.92,
"r_x3": 70.03,
"r_y3": 483.92,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.52,
"r_y0": 491.73,
"r_x1": 286.36,
"r_y1": 491.73,
"r_x2": 286.36,
"r_y2": 484.0,
"r_x3": 105.52,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 502.69,
"r_x1": 212.52,
"r_y1": 502.69,
"r_x2": 212.52,
"r_y2": 494.96,
"r_x3": 70.03,
"r_y3": 494.96,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.51,
"r_y0": 502.89,
"r_x1": 263.56,
"r_y1": 502.89,
"r_x2": 263.56,
"r_y2": 494.88,
"r_x3": 212.51,
"r_y3": 494.88,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"
},
{
"label": "list_item",
"id": 7,
"page_no": 9,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 506.2,
"r": 286.36,
"b": 547.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.22,
"r_x1": 65.68,
"r_y1": 514.22,
"r_x2": 65.68,
"r_y2": 506.2,
"r_x3": 50.11,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.02,
"r_y0": 514.22,
"r_x1": 247.37,
"r_y1": 514.22,
"r_x2": 247.37,
"r_y2": 506.2,
"r_x3": 68.02,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 253.97,
"r_y0": 514.22,
"r_x1": 286.36,
"r_y1": 514.22,
"r_x2": 286.36,
"r_y2": 506.2,
"r_x3": 253.97,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.18,
"r_x1": 265.62,
"r_y1": 525.18,
"r_x2": 265.62,
"r_y2": 517.16,
"r_x3": 70.03,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.43,
"r_y0": 524.97,
"r_x1": 286.36,
"r_y1": 524.97,
"r_x2": 286.36,
"r_y2": 517.24,
"r_x3": 268.43,
"r_y3": 517.24,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 535.93,
"r_x1": 286.36,
"r_y1": 535.93,
"r_x2": 286.36,
"r_y2": 528.2,
"r_x3": 70.03,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 546.89,
"r_x1": 125.26,
"r_y1": 546.89,
"r_x2": 125.26,
"r_y2": 539.16,
"r_x3": 70.03,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.25,
"r_y0": 547.09,
"r_x1": 240.05,
"r_y1": 547.09,
"r_x2": 240.05,
"r_y2": 539.08,
"r_x3": 125.25,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 11,
"page_no": 9,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 550.4,
"r": 286.36,
"b": 591.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.824,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 558.42,
"r_x1": 66.04,
"r_y1": 558.42,
"r_x2": 66.04,
"r_y2": 550.4,
"r_x3": 50.11,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.43,
"r_y0": 558.42,
"r_x1": 286.36,
"r_y1": 558.42,
"r_x2": 286.36,
"r_y2": 550.4,
"r_x3": 68.43,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.38,
"r_x1": 137.08,
"r_y1": 569.38,
"r_x2": 137.08,
"r_y2": 561.36,
"r_x3": 70.03,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 569.38,
"r_x1": 172.38,
"r_y1": 569.38,
"r_x2": 172.38,
"r_y2": 561.36,
"r_x3": 145.99,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.38,
"r_x1": 286.36,
"r_y1": 569.38,
"r_x2": 286.36,
"r_y2": 561.36,
"r_x3": 178.7,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.33,
"r_x1": 221.01,
"r_y1": 580.33,
"r_x2": 221.01,
"r_y2": 572.32,
"r_x3": 70.03,
"r_y3": 572.32,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.54,
"r_y0": 580.13,
"r_x1": 286.36,
"r_y1": 580.13,
"r_x2": 286.36,
"r_y2": 572.4,
"r_x3": 232.54,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.09,
"r_x1": 135.53,
"r_y1": 591.09,
"r_x2": 135.53,
"r_y2": 583.36,
"r_x3": 70.03,
"r_y3": 583.36,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.53,
"r_y0": 591.29,
"r_x1": 167.9,
"r_y1": 591.29,
"r_x2": 167.9,
"r_y2": 583.28,
"r_x3": 135.53,
"r_y3": 583.28,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"
},
{
"label": "list_item",
"id": 10,
"page_no": 9,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.6,
"r": 286.36,
"b": 635.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.836,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.62,
"r_x1": 65.24,
"r_y1": 602.62,
"r_x2": 65.24,
"r_y2": 594.6,
"r_x3": 50.11,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.51,
"r_y0": 602.62,
"r_x1": 286.36,
"r_y1": 602.62,
"r_x2": 286.36,
"r_y2": 594.6,
"r_x3": 67.51,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.58,
"r_x1": 109.11,
"r_y1": 613.58,
"r_x2": 109.11,
"r_y2": 605.56,
"r_x3": 70.03,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.23,
"r_y0": 613.58,
"r_x1": 271.77,
"r_y1": 613.58,
"r_x2": 271.77,
"r_y2": 605.56,
"r_x3": 116.23,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.89,
"r_y0": 613.58,
"r_x1": 286.36,
"r_y1": 613.58,
"r_x2": 286.36,
"r_y2": 605.56,
"r_x3": 278.89,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.33,
"r_x1": 286.36,
"r_y1": 624.33,
"r_x2": 286.36,
"r_y2": 616.6,
"r_x3": 70.03,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.29,
"r_x1": 139.1,
"r_y1": 635.29,
"r_x2": 139.1,
"r_y2": 627.56,
"r_x3": 70.03,
"r_y3": 627.56,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.49,
"r_x1": 238.96,
"r_y1": 635.49,
"r_x2": 238.96,
"r_y2": 627.48,
"r_x3": 139.1,
"r_y3": 627.48,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"
},
{
"label": "list_item",
"id": 12,
"page_no": 9,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 638.8,
"r": 286.36,
"b": 690.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.808,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.82,
"r_x1": 65.2,
"r_y1": 646.82,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.11,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.47,
"r_y0": 646.82,
"r_x1": 286.36,
"r_y1": 646.82,
"r_x2": 286.36,
"r_y2": 638.8,
"r_x3": 67.47,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 657.78,
"r_x1": 286.36,
"r_y1": 657.78,
"r_x2": 286.36,
"r_y2": 649.76,
"r_x3": 70.03,
"r_y3": 649.76,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.74,
"r_x1": 286.36,
"r_y1": 668.74,
"r_x2": 286.36,
"r_y2": 660.72,
"r_x3": 70.03,
"r_y3": 660.72,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.69,
"r_x1": 158.46,
"r_y1": 679.69,
"r_x2": 158.46,
"r_y2": 671.68,
"r_x3": 70.03,
"r_y3": 671.68,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.53,
"r_y0": 679.49,
"r_x1": 286.36,
"r_y1": 679.49,
"r_x2": 286.36,
"r_y2": 671.76,
"r_x3": 160.53,
"r_y3": 671.76,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 690.45,
"r_x1": 171.42,
"r_y1": 690.45,
"r_x2": 171.42,
"r_y2": 682.72,
"r_x3": 70.03,
"r_y3": 682.72,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.42,
"r_y0": 690.65,
"r_x1": 212.76,
"r_y1": 690.65,
"r_x2": 212.76,
"r_y2": 682.64,
"r_x3": 171.42,
"r_y3": 682.64,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 9,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 693.96,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.839,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.98,
"r_x1": 66.51,
"r_y1": 701.98,
"r_x2": 66.51,
"r_y2": 693.96,
"r_x3": 50.11,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.97,
"r_y0": 701.98,
"r_x1": 80.99,
"r_y1": 701.98,
"r_x2": 80.99,
"r_y2": 693.96,
"r_x3": 68.97,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.06,
"r_y0": 701.98,
"r_x1": 114.71,
"r_y1": 701.98,
"r_x2": 114.71,
"r_y2": 693.96,
"r_x3": 89.06,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.25,
"r_y0": 701.98,
"r_x1": 149.15,
"r_y1": 701.98,
"r_x2": 149.15,
"r_y2": 693.96,
"r_x3": 124.25,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.22,
"r_y0": 701.98,
"r_x1": 209.37,
"r_y1": 701.98,
"r_x2": 209.37,
"r_y2": 693.96,
"r_x3": 157.22,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 701.98,
"r_x1": 231.85,
"r_y1": 701.98,
"r_x2": 231.85,
"r_y2": 693.96,
"r_x3": 218.9,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.93,
"r_y0": 701.98,
"r_x1": 269.32,
"r_y1": 701.98,
"r_x2": 269.32,
"r_y2": 693.96,
"r_x3": 239.93,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.39,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 277.39,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 286.36,
"r_y1": 712.94,
"r_x2": 286.36,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"
},
{
"label": "list_item",
"id": 14,
"page_no": 9,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.78,
"t": 75.88,
"r": 545.11,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.756,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 328.78,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 472.31,
"r_y1": 94.86,
"r_x2": 472.31,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.89,
"r_y0": 94.65,
"r_x1": 545.11,
"r_y1": 94.65,
"r_x2": 545.11,
"r_y2": 86.92,
"r_x3": 475.89,
"r_y3": 86.92,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.61,
"r_x1": 371.93,
"r_y1": 105.61,
"r_x2": 371.93,
"r_y2": 97.88,
"r_x3": 328.78,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.93,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 371.93,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 417.7,
"r_y1": 116.78,
"r_x2": 417.7,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"
},
{
"label": "list_item",
"id": 9,
"page_no": 9,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 120.71,
"r": 545.11,
"b": 161.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 128.73,
"r_x1": 324.33,
"r_y1": 128.73,
"r_x2": 324.33,
"r_y2": 120.71,
"r_x3": 308.86,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.65,
"r_y0": 128.73,
"r_x1": 545.11,
"r_y1": 128.73,
"r_x2": 545.11,
"r_y2": 120.71,
"r_x3": 326.65,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 139.69,
"r_x1": 545.11,
"r_y1": 139.69,
"r_x2": 545.11,
"r_y2": 131.67,
"r_x3": 328.78,
"r_y3": 131.67,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 150.44,
"r_x1": 545.11,
"r_y1": 150.44,
"r_x2": 545.11,
"r_y2": 142.71,
"r_x3": 328.78,
"r_y3": 142.71,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.4,
"r_x1": 406.32,
"r_y1": 161.4,
"r_x2": 406.32,
"r_y2": 153.67,
"r_x3": 328.78,
"r_y3": 153.67,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 161.61,
"r_x1": 506.18,
"r_y1": 161.61,
"r_x2": 506.18,
"r_y2": 153.59,
"r_x3": 406.32,
"r_y3": 153.59,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"
},
{
"label": "page_footer",
"id": 0,
"page_no": 9,
"cluster": {
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.907,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "10"
}
],
"body": [
{
"label": "text",
"id": 15,
"page_no": 9,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 70.03,
"t": 75.88,
"r": 286.36,
"b": 94.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.689,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 83.69,
"r_x1": 223.58,
"r_y1": 83.69,
"r_x2": 223.58,
"r_y2": 75.96,
"r_x3": 70.03,
"r_y3": 75.96,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.58,
"r_y0": 83.9,
"r_x1": 286.36,
"r_y1": 83.9,
"r_x2": 286.36,
"r_y2": 75.88,
"r_x3": 223.58,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 94.86,
"r_x1": 97.92,
"r_y1": 94.86,
"r_x2": 97.92,
"r_y2": 86.84,
"r_x3": 70.03,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"
},
{
"label": "list_item",
"id": 13,
"page_no": 9,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 98.17,
"r": 286.37,
"b": 160.98,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 106.18,
"r_x1": 65.53,
"r_y1": 106.18,
"r_x2": 65.53,
"r_y2": 98.17,
"r_x3": 50.11,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 106.18,
"r_x1": 286.36,
"r_y1": 106.18,
"r_x2": 286.36,
"r_y2": 98.17,
"r_x3": 67.85,
"r_y3": 98.17,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 117.14,
"r_x1": 286.36,
"r_y1": 117.14,
"r_x2": 286.36,
"r_y2": 109.12,
"r_x3": 70.03,
"r_y3": 109.12,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 128.1,
"r_x1": 286.36,
"r_y1": 128.1,
"r_x2": 286.36,
"r_y2": 120.08,
"r_x3": 70.03,
"r_y3": 120.08,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 139.06,
"r_x1": 77.5,
"r_y1": 139.06,
"r_x2": 77.5,
"r_y2": 131.04,
"r_x3": 70.03,
"r_y3": 131.04,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.56,
"r_y0": 138.85,
"r_x1": 286.37,
"r_y1": 138.85,
"r_x2": 286.37,
"r_y2": 131.12,
"r_x3": 80.56,
"r_y3": 131.12,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 149.81,
"r_x1": 195.23,
"r_y1": 149.81,
"r_x2": 195.23,
"r_y2": 142.08,
"r_x3": 70.03,
"r_y3": 142.08,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.23,
"r_y0": 150.02,
"r_x1": 286.37,
"r_y1": 150.02,
"r_x2": 286.37,
"r_y2": 142.0,
"r_x3": 195.23,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 160.98,
"r_x1": 120.33,
"r_y1": 160.98,
"r_x2": 120.33,
"r_y2": 152.96,
"r_x3": 70.03,
"r_y3": 152.96,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1"
},
{
"label": "list_item",
"id": 2,
"page_no": 9,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 164.28,
"r": 286.36,
"b": 227.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 172.3,
"r_x1": 65.53,
"r_y1": 172.3,
"r_x2": 65.53,
"r_y2": 164.28,
"r_x3": 50.11,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.85,
"r_y0": 172.3,
"r_x1": 286.36,
"r_y1": 172.3,
"r_x2": 286.36,
"r_y2": 164.28,
"r_x3": 67.85,
"r_y3": 164.28,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 183.26,
"r_x1": 286.36,
"r_y1": 183.26,
"r_x2": 286.36,
"r_y2": 175.24,
"r_x3": 70.03,
"r_y3": 175.24,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 194.22,
"r_x1": 286.36,
"r_y1": 194.22,
"r_x2": 286.36,
"r_y2": 186.2,
"r_x3": 70.03,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 205.18,
"r_x1": 101.33,
"r_y1": 205.18,
"r_x2": 101.33,
"r_y2": 197.16,
"r_x3": 70.03,
"r_y3": 197.16,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.33,
"r_y0": 204.97,
"r_x1": 286.36,
"r_y1": 204.97,
"r_x2": 286.36,
"r_y2": 197.24,
"r_x3": 104.33,
"r_y3": 197.24,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 215.93,
"r_x1": 220.49,
"r_y1": 215.93,
"r_x2": 220.49,
"r_y2": 208.2,
"r_x3": 70.03,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.48,
"r_y0": 216.14,
"r_x1": 286.36,
"r_y1": 216.14,
"r_x2": 286.36,
"r_y2": 208.12,
"r_x3": 220.48,
"r_y3": 208.12,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 227.09,
"r_x1": 166.65,
"r_y1": 227.09,
"r_x2": 166.65,
"r_y2": 219.08,
"r_x3": 70.03,
"r_y3": 219.08,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"
},
{
"label": "list_item",
"id": 4,
"page_no": 9,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 230.4,
"r": 286.37,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.851,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 238.42,
"r_x1": 65.65,
"r_y1": 238.42,
"r_x2": 65.65,
"r_y2": 230.4,
"r_x3": 50.11,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.98,
"r_y0": 238.42,
"r_x1": 286.36,
"r_y1": 238.42,
"r_x2": 286.36,
"r_y2": 230.4,
"r_x3": 67.98,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 249.38,
"r_x1": 147.17,
"r_y1": 249.38,
"r_x2": 147.17,
"r_y2": 241.36,
"r_x3": 70.03,
"r_y3": 241.36,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.93,
"r_y0": 249.17,
"r_x1": 286.37,
"r_y1": 249.17,
"r_x2": 286.37,
"r_y2": 241.44,
"r_x3": 149.93,
"r_y3": 241.44,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 260.13,
"r_x1": 244.69,
"r_y1": 260.13,
"r_x2": 244.69,
"r_y2": 252.4,
"r_x3": 70.03,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.69,
"r_y0": 260.34,
"r_x1": 286.36,
"r_y1": 260.34,
"r_x2": 286.36,
"r_y2": 252.32,
"r_x3": 244.69,
"r_y3": 252.32,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 271.3,
"r_x1": 111.37,
"r_y1": 271.3,
"r_x2": 111.37,
"r_y2": 263.28,
"r_x3": 70.03,
"r_y3": 263.28,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 9,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 274.6,
"r": 286.37,
"b": 326.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 282.62,
"r_x1": 66.02,
"r_y1": 282.62,
"r_x2": 66.02,
"r_y2": 274.6,
"r_x3": 50.11,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.41,
"r_y0": 282.62,
"r_x1": 94.94,
"r_y1": 282.62,
"r_x2": 94.94,
"r_y2": 274.6,
"r_x3": 68.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.87,
"r_y0": 282.62,
"r_x1": 127.27,
"r_y1": 282.62,
"r_x2": 127.27,
"r_y2": 274.6,
"r_x3": 100.87,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.19,
"r_y0": 282.62,
"r_x1": 165.83,
"r_y1": 282.62,
"r_x2": 165.83,
"r_y2": 274.6,
"r_x3": 133.19,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.68,
"r_y0": 282.62,
"r_x1": 194.09,
"r_y1": 282.62,
"r_x2": 194.09,
"r_y2": 274.6,
"r_x3": 172.68,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.02,
"r_y0": 282.62,
"r_x1": 211.48,
"r_y1": 282.62,
"r_x2": 211.48,
"r_y2": 274.6,
"r_x3": 200.02,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.41,
"r_y0": 282.62,
"r_x1": 239.44,
"r_y1": 282.62,
"r_x2": 239.44,
"r_y2": 274.6,
"r_x3": 217.41,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.29,
"r_y0": 282.62,
"r_x1": 264.22,
"r_y1": 282.62,
"r_x2": 264.22,
"r_y2": 274.6,
"r_x3": 246.29,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.15,
"r_y0": 282.62,
"r_x1": 286.36,
"r_y1": 282.62,
"r_x2": 286.36,
"r_y2": 274.6,
"r_x3": 270.15,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 293.58,
"r_x1": 286.36,
"r_y1": 293.58,
"r_x2": 286.36,
"r_y2": 285.56,
"r_x3": 70.03,
"r_y3": 285.56,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 304.54,
"r_x1": 286.36,
"r_y1": 304.54,
"r_x2": 286.36,
"r_y2": 296.52,
"r_x3": 70.03,
"r_y3": 296.52,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.48,
"r_x3": 70.03,
"r_y3": 307.48,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.35,
"r_y0": 315.29,
"r_x1": 286.37,
"r_y1": 315.29,
"r_x2": 286.37,
"r_y2": 307.56,
"r_x3": 79.35,
"r_y3": 307.56,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 326.25,
"r_x1": 147.57,
"r_y1": 326.25,
"r_x2": 147.57,
"r_y2": 318.52,
"r_x3": 70.03,
"r_y3": 318.52,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.57,
"r_y0": 326.45,
"r_x1": 271.34,
"r_y1": 326.45,
"r_x2": 271.34,
"r_y2": 318.44,
"r_x3": 147.57,
"r_y3": 318.44,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 3,
"page_no": 9,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 329.76,
"r": 286.36,
"b": 381.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 337.78,
"r_x1": 65.37,
"r_y1": 337.78,
"r_x2": 65.37,
"r_y2": 329.76,
"r_x3": 50.11,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.66,
"r_y0": 337.78,
"r_x1": 286.36,
"r_y1": 337.78,
"r_x2": 286.36,
"r_y2": 329.76,
"r_x3": 67.66,
"r_y3": 329.76,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 348.74,
"r_x1": 286.36,
"r_y1": 348.74,
"r_x2": 286.36,
"r_y2": 340.72,
"r_x3": 70.03,
"r_y3": 340.72,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 359.7,
"r_x1": 198.82,
"r_y1": 359.7,
"r_x2": 198.82,
"r_y2": 351.68,
"r_x3": 70.03,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.06,
"r_y0": 359.7,
"r_x1": 213.53,
"r_y1": 359.7,
"r_x2": 213.53,
"r_y2": 351.68,
"r_x3": 206.06,
"r_y3": 351.68,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.02,
"r_y0": 359.49,
"r_x1": 286.36,
"r_y1": 359.49,
"r_x2": 286.36,
"r_y2": 351.76,
"r_x3": 217.02,
"r_y3": 351.76,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 370.45,
"r_x1": 143.08,
"r_y1": 370.45,
"r_x2": 143.08,
"r_y2": 362.72,
"r_x3": 70.03,
"r_y3": 362.72,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.08,
"r_y0": 370.66,
"r_x1": 286.36,
"r_y1": 370.66,
"r_x2": 286.36,
"r_y2": 362.64,
"r_x3": 143.08,
"r_y3": 362.64,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 381.61,
"r_x1": 161.16,
"r_y1": 381.61,
"r_x2": 161.16,
"r_y2": 373.6,
"r_x3": 70.03,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"
},
{
"label": "list_item",
"id": 1,
"page_no": 9,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 384.92,
"r": 286.36,
"b": 458.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.883,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 392.94,
"r_x1": 65.14,
"r_y1": 392.94,
"r_x2": 65.14,
"r_y2": 384.92,
"r_x3": 50.11,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.94,
"r_x1": 286.36,
"r_y1": 392.94,
"r_x2": 286.36,
"r_y2": 384.92,
"r_x3": 67.4,
"r_y3": 384.92,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 403.9,
"r_x1": 286.36,
"r_y1": 403.9,
"r_x2": 286.36,
"r_y2": 395.88,
"r_x3": 70.03,
"r_y3": 395.88,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 414.86,
"r_x1": 125.47,
"r_y1": 414.86,
"r_x2": 125.47,
"r_y2": 406.84,
"r_x3": 70.03,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.91,
"r_y0": 414.86,
"r_x1": 230.83,
"r_y1": 414.86,
"r_x2": 230.83,
"r_y2": 406.84,
"r_x3": 133.91,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.27,
"r_y0": 414.86,
"r_x1": 286.36,
"r_y1": 414.86,
"r_x2": 286.36,
"r_y2": 406.84,
"r_x3": 239.27,
"r_y3": 406.84,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 425.82,
"r_x1": 78.96,
"r_y1": 425.82,
"r_x2": 78.96,
"r_y2": 417.8,
"r_x3": 70.03,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.25,
"r_y0": 425.82,
"r_x1": 286.36,
"r_y1": 425.82,
"r_x2": 286.36,
"r_y2": 417.8,
"r_x3": 81.25,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 436.77,
"r_x1": 196.76,
"r_y1": 436.77,
"r_x2": 196.76,
"r_y2": 428.76,
"r_x3": 70.03,
"r_y3": 428.76,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.57,
"r_x1": 286.36,
"r_y1": 436.57,
"r_x2": 286.36,
"r_y2": 428.84,
"r_x3": 200.2,
"r_y3": 428.84,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 447.53,
"r_x1": 189.19,
"r_y1": 447.53,
"r_x2": 189.19,
"r_y2": 439.8,
"r_x3": 70.03,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.73,
"r_x1": 286.36,
"r_y1": 447.73,
"r_x2": 286.36,
"r_y2": 439.72,
"r_x3": 189.2,
"r_y3": 439.72,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 458.69,
"r_x1": 158.92,
"r_y1": 458.69,
"r_x2": 158.92,
"r_y2": 450.68,
"r_x3": 70.03,
"r_y3": 450.68,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"
},
{
"label": "list_item",
"id": 6,
"page_no": 9,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 462.0,
"r": 286.36,
"b": 502.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.843,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 470.02,
"r_x1": 65.91,
"r_y1": 470.02,
"r_x2": 65.91,
"r_y2": 462.0,
"r_x3": 50.11,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.28,
"r_y0": 470.02,
"r_x1": 286.36,
"r_y1": 470.02,
"r_x2": 286.36,
"r_y2": 462.0,
"r_x3": 68.28,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 480.97,
"r_x1": 116.28,
"r_y1": 480.97,
"r_x2": 116.28,
"r_y2": 472.96,
"r_x3": 70.03,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.48,
"r_y0": 480.97,
"r_x1": 286.36,
"r_y1": 480.97,
"r_x2": 286.36,
"r_y2": 472.96,
"r_x3": 122.48,
"r_y3": 472.96,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 491.93,
"r_x1": 103.31,
"r_y1": 491.93,
"r_x2": 103.31,
"r_y2": 483.92,
"r_x3": 70.03,
"r_y3": 483.92,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.52,
"r_y0": 491.73,
"r_x1": 286.36,
"r_y1": 491.73,
"r_x2": 286.36,
"r_y2": 484.0,
"r_x3": 105.52,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 502.69,
"r_x1": 212.52,
"r_y1": 502.69,
"r_x2": 212.52,
"r_y2": 494.96,
"r_x3": 70.03,
"r_y3": 494.96,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.51,
"r_y0": 502.89,
"r_x1": 263.56,
"r_y1": 502.89,
"r_x2": 263.56,
"r_y2": 494.88,
"r_x3": 212.51,
"r_y3": 494.88,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"
},
{
"label": "list_item",
"id": 7,
"page_no": 9,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 506.2,
"r": 286.36,
"b": 547.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 514.22,
"r_x1": 65.68,
"r_y1": 514.22,
"r_x2": 65.68,
"r_y2": 506.2,
"r_x3": 50.11,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.02,
"r_y0": 514.22,
"r_x1": 247.37,
"r_y1": 514.22,
"r_x2": 247.37,
"r_y2": 506.2,
"r_x3": 68.02,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 253.97,
"r_y0": 514.22,
"r_x1": 286.36,
"r_y1": 514.22,
"r_x2": 286.36,
"r_y2": 506.2,
"r_x3": 253.97,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 525.18,
"r_x1": 265.62,
"r_y1": 525.18,
"r_x2": 265.62,
"r_y2": 517.16,
"r_x3": 70.03,
"r_y3": 517.16,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.43,
"r_y0": 524.97,
"r_x1": 286.36,
"r_y1": 524.97,
"r_x2": 286.36,
"r_y2": 517.24,
"r_x3": 268.43,
"r_y3": 517.24,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 535.93,
"r_x1": 286.36,
"r_y1": 535.93,
"r_x2": 286.36,
"r_y2": 528.2,
"r_x3": 70.03,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 546.89,
"r_x1": 125.26,
"r_y1": 546.89,
"r_x2": 125.26,
"r_y2": 539.16,
"r_x3": 70.03,
"r_y3": 539.16,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.25,
"r_y0": 547.09,
"r_x1": 240.05,
"r_y1": 547.09,
"r_x2": 240.05,
"r_y2": 539.08,
"r_x3": 125.25,
"r_y3": 539.08,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 11,
"page_no": 9,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 550.4,
"r": 286.36,
"b": 591.29,
"coord_origin": "TOPLEFT"
},
"confidence": 0.824,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 558.42,
"r_x1": 66.04,
"r_y1": 558.42,
"r_x2": 66.04,
"r_y2": 550.4,
"r_x3": 50.11,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.43,
"r_y0": 558.42,
"r_x1": 286.36,
"r_y1": 558.42,
"r_x2": 286.36,
"r_y2": 550.4,
"r_x3": 68.43,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 569.38,
"r_x1": 137.08,
"r_y1": 569.38,
"r_x2": 137.08,
"r_y2": 561.36,
"r_x3": 70.03,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.99,
"r_y0": 569.38,
"r_x1": 172.38,
"r_y1": 569.38,
"r_x2": 172.38,
"r_y2": 561.36,
"r_x3": 145.99,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.38,
"r_x1": 286.36,
"r_y1": 569.38,
"r_x2": 286.36,
"r_y2": 561.36,
"r_x3": 178.7,
"r_y3": 561.36,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 580.33,
"r_x1": 221.01,
"r_y1": 580.33,
"r_x2": 221.01,
"r_y2": 572.32,
"r_x3": 70.03,
"r_y3": 572.32,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.54,
"r_y0": 580.13,
"r_x1": 286.36,
"r_y1": 580.13,
"r_x2": 286.36,
"r_y2": 572.4,
"r_x3": 232.54,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 591.09,
"r_x1": 135.53,
"r_y1": 591.09,
"r_x2": 135.53,
"r_y2": 583.36,
"r_x3": 70.03,
"r_y3": 583.36,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.53,
"r_y0": 591.29,
"r_x1": 167.9,
"r_y1": 591.29,
"r_x2": 167.9,
"r_y2": 583.28,
"r_x3": 135.53,
"r_y3": 583.28,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"
},
{
"label": "list_item",
"id": 10,
"page_no": 9,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 594.6,
"r": 286.36,
"b": 635.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.836,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 602.62,
"r_x1": 65.24,
"r_y1": 602.62,
"r_x2": 65.24,
"r_y2": 594.6,
"r_x3": 50.11,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.51,
"r_y0": 602.62,
"r_x1": 286.36,
"r_y1": 602.62,
"r_x2": 286.36,
"r_y2": 594.6,
"r_x3": 67.51,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 613.58,
"r_x1": 109.11,
"r_y1": 613.58,
"r_x2": 109.11,
"r_y2": 605.56,
"r_x3": 70.03,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.23,
"r_y0": 613.58,
"r_x1": 271.77,
"r_y1": 613.58,
"r_x2": 271.77,
"r_y2": 605.56,
"r_x3": 116.23,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.89,
"r_y0": 613.58,
"r_x1": 286.36,
"r_y1": 613.58,
"r_x2": 286.36,
"r_y2": 605.56,
"r_x3": 278.89,
"r_y3": 605.56,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 624.33,
"r_x1": 286.36,
"r_y1": 624.33,
"r_x2": 286.36,
"r_y2": 616.6,
"r_x3": 70.03,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 635.29,
"r_x1": 139.1,
"r_y1": 635.29,
"r_x2": 139.1,
"r_y2": 627.56,
"r_x3": 70.03,
"r_y3": 627.56,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.49,
"r_x1": 238.96,
"r_y1": 635.49,
"r_x2": 238.96,
"r_y2": 627.48,
"r_x3": 139.1,
"r_y3": 627.48,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"
},
{
"label": "list_item",
"id": 12,
"page_no": 9,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 638.8,
"r": 286.36,
"b": 690.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.808,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 646.82,
"r_x1": 65.2,
"r_y1": 646.82,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.11,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.47,
"r_y0": 646.82,
"r_x1": 286.36,
"r_y1": 646.82,
"r_x2": 286.36,
"r_y2": 638.8,
"r_x3": 67.47,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 657.78,
"r_x1": 286.36,
"r_y1": 657.78,
"r_x2": 286.36,
"r_y2": 649.76,
"r_x3": 70.03,
"r_y3": 649.76,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 668.74,
"r_x1": 286.36,
"r_y1": 668.74,
"r_x2": 286.36,
"r_y2": 660.72,
"r_x3": 70.03,
"r_y3": 660.72,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 679.69,
"r_x1": 158.46,
"r_y1": 679.69,
"r_x2": 158.46,
"r_y2": 671.68,
"r_x3": 70.03,
"r_y3": 671.68,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.53,
"r_y0": 679.49,
"r_x1": 286.36,
"r_y1": 679.49,
"r_x2": 286.36,
"r_y2": 671.76,
"r_x3": 160.53,
"r_y3": 671.76,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 690.45,
"r_x1": 171.42,
"r_y1": 690.45,
"r_x2": 171.42,
"r_y2": 682.72,
"r_x3": 70.03,
"r_y3": 682.72,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.42,
"r_y0": 690.65,
"r_x1": 212.76,
"r_y1": 690.65,
"r_x2": 212.76,
"r_y2": 682.64,
"r_x3": 171.42,
"r_y3": 682.64,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 9,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 693.96,
"r": 286.36,
"b": 712.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.839,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 701.98,
"r_x1": 66.51,
"r_y1": 701.98,
"r_x2": 66.51,
"r_y2": 693.96,
"r_x3": 50.11,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.97,
"r_y0": 701.98,
"r_x1": 80.99,
"r_y1": 701.98,
"r_x2": 80.99,
"r_y2": 693.96,
"r_x3": 68.97,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.06,
"r_y0": 701.98,
"r_x1": 114.71,
"r_y1": 701.98,
"r_x2": 114.71,
"r_y2": 693.96,
"r_x3": 89.06,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.25,
"r_y0": 701.98,
"r_x1": 149.15,
"r_y1": 701.98,
"r_x2": 149.15,
"r_y2": 693.96,
"r_x3": 124.25,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.22,
"r_y0": 701.98,
"r_x1": 209.37,
"r_y1": 701.98,
"r_x2": 209.37,
"r_y2": 693.96,
"r_x3": 157.22,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 701.98,
"r_x1": 231.85,
"r_y1": 701.98,
"r_x2": 231.85,
"r_y2": 693.96,
"r_x3": 218.9,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.93,
"r_y0": 701.98,
"r_x1": 269.32,
"r_y1": 701.98,
"r_x2": 269.32,
"r_y2": 693.96,
"r_x3": 239.93,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.39,
"r_y0": 701.98,
"r_x1": 286.36,
"r_y1": 701.98,
"r_x2": 286.36,
"r_y2": 693.96,
"r_x3": 277.39,
"r_y3": 693.96,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.03,
"r_y0": 712.94,
"r_x1": 286.36,
"r_y1": 712.94,
"r_x2": 286.36,
"r_y2": 704.92,
"r_x3": 70.03,
"r_y3": 704.92,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"
},
{
"label": "list_item",
"id": 14,
"page_no": 9,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.78,
"t": 75.88,
"r": 545.11,
"b": 116.78,
"coord_origin": "TOPLEFT"
},
"confidence": 0.756,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 83.9,
"r_x1": 545.11,
"r_y1": 83.9,
"r_x2": 545.11,
"r_y2": 75.88,
"r_x3": 328.78,
"r_y3": 75.88,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 94.86,
"r_x1": 472.31,
"r_y1": 94.86,
"r_x2": 472.31,
"r_y2": 86.84,
"r_x3": 328.78,
"r_y3": 86.84,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.89,
"r_y0": 94.65,
"r_x1": 545.11,
"r_y1": 94.65,
"r_x2": 545.11,
"r_y2": 86.92,
"r_x3": 475.89,
"r_y3": 86.92,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 105.61,
"r_x1": 371.93,
"r_y1": 105.61,
"r_x2": 371.93,
"r_y2": 97.88,
"r_x3": 328.78,
"r_y3": 97.88,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.93,
"r_y0": 105.82,
"r_x1": 545.11,
"r_y1": 105.82,
"r_x2": 545.11,
"r_y2": 97.8,
"r_x3": 371.93,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 116.78,
"r_x1": 417.7,
"r_y1": 116.78,
"r_x2": 417.7,
"r_y2": 108.76,
"r_x3": 328.78,
"r_y3": 108.76,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"
},
{
"label": "list_item",
"id": 9,
"page_no": 9,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 120.71,
"r": 545.11,
"b": 161.61,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 128.73,
"r_x1": 324.33,
"r_y1": 128.73,
"r_x2": 324.33,
"r_y2": 120.71,
"r_x3": 308.86,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.65,
"r_y0": 128.73,
"r_x1": 545.11,
"r_y1": 128.73,
"r_x2": 545.11,
"r_y2": 120.71,
"r_x3": 326.65,
"r_y3": 120.71,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 139.69,
"r_x1": 545.11,
"r_y1": 139.69,
"r_x2": 545.11,
"r_y2": 131.67,
"r_x3": 328.78,
"r_y3": 131.67,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 150.44,
"r_x1": 545.11,
"r_y1": 150.44,
"r_x2": 545.11,
"r_y2": 142.71,
"r_x3": 328.78,
"r_y3": 142.71,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.78,
"r_y0": 161.4,
"r_x1": 406.32,
"r_y1": 161.4,
"r_x2": 406.32,
"r_y2": 153.67,
"r_x3": 328.78,
"r_y3": 153.67,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.32,
"r_y0": 161.61,
"r_x1": 506.18,
"r_y1": 161.61,
"r_x2": 506.18,
"r_y2": 153.59,
"r_x3": 406.32,
"r_y3": 153.59,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"
}
],
"headers": [
{
"label": "page_footer",
"id": 0,
"page_no": 9,
"cluster": {
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.907,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "10"
}
]
}
},
{
"page_no": 10,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.84,
"r_y0": 121.32,
"r_x1": 465.38,
"r_y1": 121.32,
"r_x2": 465.38,
"r_y2": 110.57,
"r_x3": 132.84,
"r_y3": 110.57,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.18,
"r_y0": 135.53,
"r_x1": 375.04,
"r_y1": 135.53,
"r_x2": 375.04,
"r_y2": 122.26,
"r_x3": 220.18,
"r_y3": 122.26,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 171.91,
"r_x1": 57.09,
"r_y1": 171.91,
"r_x2": 57.09,
"r_y2": 161.16,
"r_x3": 50.11,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.39,
"r_y0": 171.91,
"r_x1": 175.96,
"r_y1": 171.91,
"r_x2": 175.96,
"r_y2": 161.16,
"r_x3": 66.39,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 190.83,
"r_x1": 64.21,
"r_y1": 190.83,
"r_x2": 64.21,
"r_y2": 180.98,
"r_x3": 50.11,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.61,
"r_y0": 190.83,
"r_x1": 150.36,
"r_y1": 190.83,
"r_x2": 150.36,
"r_y2": 180.98,
"r_x3": 73.61,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 208.83,
"r_x1": 286.36,
"r_y1": 208.83,
"r_x2": 286.36,
"r_y2": 199.92,
"r_x3": 62.07,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 220.78,
"r_x1": 286.37,
"r_y1": 220.78,
"r_x2": 286.37,
"r_y2": 211.88,
"r_x3": 50.11,
"r_y3": 211.88,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 232.74,
"r_x1": 286.37,
"r_y1": 232.74,
"r_x2": 286.37,
"r_y2": 223.83,
"r_x3": 50.11,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 244.69,
"r_x1": 286.37,
"r_y1": 244.69,
"r_x2": 286.37,
"r_y2": 235.79,
"r_x3": 50.11,
"r_y3": 235.79,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 256.65,
"r_x1": 286.37,
"r_y1": 256.65,
"r_x2": 286.37,
"r_y2": 247.74,
"r_x3": 50.11,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 268.6,
"r_x1": 286.37,
"r_y1": 268.6,
"r_x2": 286.37,
"r_y2": 259.7,
"r_x3": 50.11,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 280.56,
"r_x1": 286.37,
"r_y1": 280.56,
"r_x2": 286.37,
"r_y2": 271.65,
"r_x3": 50.11,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 292.51,
"r_x1": 286.37,
"r_y1": 292.51,
"r_x2": 286.37,
"r_y2": 283.61,
"r_x3": 50.11,
"r_y3": 283.61,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 304.47,
"r_x1": 286.37,
"r_y1": 304.47,
"r_x2": 286.37,
"r_y2": 295.56,
"r_x3": 50.11,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 316.42,
"r_x1": 286.37,
"r_y1": 316.42,
"r_x2": 286.37,
"r_y2": 307.52,
"r_x3": 50.11,
"r_y3": 307.52,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 328.38,
"r_x1": 286.37,
"r_y1": 328.38,
"r_x2": 286.37,
"r_y2": 319.47,
"r_x3": 50.11,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 340.33,
"r_x1": 286.37,
"r_y1": 340.33,
"r_x2": 286.37,
"r_y2": 331.43,
"r_x3": 50.11,
"r_y3": 331.43,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 352.29,
"r_x1": 286.37,
"r_y1": 352.29,
"r_x2": 286.37,
"r_y2": 343.38,
"r_x3": 50.11,
"r_y3": 343.38,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 364.24,
"r_x1": 286.37,
"r_y1": 364.24,
"r_x2": 286.37,
"r_y2": 355.34,
"r_x3": 50.11,
"r_y3": 355.34,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 376.2,
"r_x1": 286.37,
"r_y1": 376.2,
"r_x2": 286.37,
"r_y2": 367.29,
"r_x3": 50.11,
"r_y3": 367.29,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 388.15,
"r_x1": 230.8,
"r_y1": 388.15,
"r_x2": 230.8,
"r_y2": 379.25,
"r_x3": 50.11,
"r_y3": 379.25,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 400.31,
"r_x1": 286.36,
"r_y1": 400.31,
"r_x2": 286.36,
"r_y2": 391.41,
"r_x3": 62.07,
"r_y3": 391.41,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 412.27,
"r_x1": 286.37,
"r_y1": 412.27,
"r_x2": 286.37,
"r_y2": 403.36,
"r_x3": 50.11,
"r_y3": 403.36,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 424.22,
"r_x1": 286.37,
"r_y1": 424.22,
"r_x2": 286.37,
"r_y2": 415.32,
"r_x3": 50.11,
"r_y3": 415.32,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 436.18,
"r_x1": 286.37,
"r_y1": 436.18,
"r_x2": 286.37,
"r_y2": 427.27,
"r_x3": 50.11,
"r_y3": 427.27,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.13,
"r_x1": 286.37,
"r_y1": 448.13,
"r_x2": 286.37,
"r_y2": 439.23,
"r_x3": 50.11,
"r_y3": 439.23,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.09,
"r_x1": 286.37,
"r_y1": 460.09,
"r_x2": 286.37,
"r_y2": 451.18,
"r_x3": 50.11,
"r_y3": 451.18,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.04,
"r_x1": 286.37,
"r_y1": 472.04,
"r_x2": 286.37,
"r_y2": 463.14,
"r_x3": 50.11,
"r_y3": 463.14,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.0,
"r_x1": 286.37,
"r_y1": 484.0,
"r_x2": 286.37,
"r_y2": 475.09,
"r_x3": 50.11,
"r_y3": 475.09,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 495.95,
"r_x1": 286.37,
"r_y1": 495.95,
"r_x2": 286.37,
"r_y2": 487.05,
"r_x3": 50.11,
"r_y3": 487.05,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 507.91,
"r_x1": 286.37,
"r_y1": 507.91,
"r_x2": 286.37,
"r_y2": 499.0,
"r_x3": 50.11,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 519.86,
"r_x1": 286.37,
"r_y1": 519.86,
"r_x2": 286.37,
"r_y2": 510.96,
"r_x3": 50.11,
"r_y3": 510.96,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.82,
"r_x1": 286.37,
"r_y1": 531.82,
"r_x2": 286.37,
"r_y2": 522.91,
"r_x3": 50.11,
"r_y3": 522.91,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.77,
"r_x1": 286.37,
"r_y1": 543.77,
"r_x2": 286.37,
"r_y2": 534.87,
"r_x3": 50.11,
"r_y3": 534.87,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.73,
"r_x1": 286.37,
"r_y1": 555.73,
"r_x2": 286.37,
"r_y2": 546.82,
"r_x3": 50.11,
"r_y3": 546.82,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.68,
"r_x1": 257.47,
"r_y1": 567.68,
"r_x2": 257.47,
"r_y2": 558.78,
"r_x3": 50.11,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.95,
"r_y0": 567.68,
"r_x1": 286.37,
"r_y1": 567.68,
"r_x2": 286.37,
"r_y2": 558.78,
"r_x3": 263.95,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.64,
"r_x1": 286.37,
"r_y1": 579.64,
"r_x2": 286.37,
"r_y2": 570.73,
"r_x3": 50.11,
"r_y3": 570.73,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.59,
"r_x1": 286.37,
"r_y1": 591.59,
"r_x2": 286.37,
"r_y2": 582.69,
"r_x3": 50.11,
"r_y3": 582.69,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.55,
"r_x1": 286.37,
"r_y1": 603.55,
"r_x2": 286.37,
"r_y2": 594.64,
"r_x3": 50.11,
"r_y3": 594.64,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.5,
"r_x1": 286.37,
"r_y1": 615.5,
"r_x2": 286.37,
"r_y2": 606.6,
"r_x3": 50.11,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.46,
"r_x1": 242.26,
"r_y1": 627.46,
"r_x2": 242.26,
"r_y2": 618.55,
"r_x3": 50.11,
"r_y3": 618.55,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 639.62,
"r_x1": 286.36,
"r_y1": 639.62,
"r_x2": 286.36,
"r_y2": 630.71,
"r_x3": 62.07,
"r_y3": 630.71,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 651.57,
"r_x1": 179.9,
"r_y1": 651.57,
"r_x2": 179.9,
"r_y2": 642.67,
"r_x3": 50.11,
"r_y3": 642.67,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 672.24,
"r_x1": 64.3,
"r_y1": 672.24,
"r_x2": 64.3,
"r_y2": 662.39,
"r_x3": 50.11,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.75,
"r_y0": 672.24,
"r_x1": 153.61,
"r_y1": 672.24,
"r_x2": 153.61,
"r_y2": 662.39,
"r_x3": 73.75,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 690.24,
"r_x1": 286.36,
"r_y1": 690.24,
"r_x2": 286.36,
"r_y2": 681.33,
"r_x3": 62.07,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 702.19,
"r_x1": 286.37,
"r_y1": 702.19,
"r_x2": 286.37,
"r_y2": 693.29,
"r_x3": 50.11,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 714.15,
"r_x1": 84.14,
"r_y1": 714.15,
"r_x2": 84.14,
"r_y2": 705.24,
"r_x3": 50.11,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.24,
"r_y0": 714.15,
"r_x1": 286.37,
"r_y1": 714.15,
"r_x2": 286.37,
"r_y2": 705.24,
"r_x3": 91.24,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 171.56,
"r_x1": 545.12,
"r_y1": 171.56,
"r_x2": 545.12,
"r_y2": 162.66,
"r_x3": 308.86,
"r_y3": 162.66,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.52,
"r_x1": 545.12,
"r_y1": 183.52,
"r_x2": 545.12,
"r_y2": 174.61,
"r_x3": 308.86,
"r_y3": 174.61,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 195.47,
"r_x1": 545.12,
"r_y1": 195.47,
"r_x2": 545.12,
"r_y2": 186.57,
"r_x3": 308.86,
"r_y3": 186.57,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 207.43,
"r_x1": 484.07,
"r_y1": 207.43,
"r_x2": 484.07,
"r_y2": 198.52,
"r_x3": 308.86,
"r_y3": 198.52,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 220.14,
"r_x1": 545.12,
"r_y1": 220.14,
"r_x2": 545.12,
"r_y2": 211.24,
"r_x3": 320.82,
"r_y3": 211.24,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.1,
"r_x1": 448.09,
"r_y1": 232.1,
"r_x2": 448.09,
"r_y2": 223.19,
"r_x3": 308.86,
"r_y3": 223.19,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 244.81,
"r_x1": 328.29,
"r_y1": 244.81,
"r_x2": 328.29,
"r_y2": 235.91,
"r_x3": 320.82,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.38,
"r_y0": 244.81,
"r_x1": 545.11,
"r_y1": 244.81,
"r_x2": 545.11,
"r_y2": 235.91,
"r_x3": 335.38,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.77,
"r_x1": 545.12,
"r_y1": 256.77,
"r_x2": 545.12,
"r_y2": 247.86,
"r_x3": 308.86,
"r_y3": 247.86,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.72,
"r_x1": 545.12,
"r_y1": 268.72,
"r_x2": 545.12,
"r_y2": 259.82,
"r_x3": 308.86,
"r_y3": 259.82,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.68,
"r_x1": 393.38,
"r_y1": 280.68,
"r_x2": 393.38,
"r_y2": 271.77,
"r_x3": 308.86,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.12,
"r_y0": 280.68,
"r_x1": 545.12,
"r_y1": 280.68,
"r_x2": 545.12,
"r_y2": 271.77,
"r_x3": 400.12,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.63,
"r_x1": 545.12,
"r_y1": 292.63,
"r_x2": 545.12,
"r_y2": 283.73,
"r_x3": 308.86,
"r_y3": 283.73,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.59,
"r_x1": 545.12,
"r_y1": 304.59,
"r_x2": 545.12,
"r_y2": 295.68,
"r_x3": 308.86,
"r_y3": 295.68,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.54,
"r_x1": 425.69,
"r_y1": 316.54,
"r_x2": 425.69,
"r_y2": 307.64,
"r_x3": 308.86,
"r_y3": 307.64,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 329.26,
"r_x1": 328.49,
"r_y1": 329.26,
"r_x2": 328.49,
"r_y2": 320.35,
"r_x3": 320.82,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.05,
"r_y0": 329.26,
"r_x1": 545.11,
"r_y1": 329.26,
"r_x2": 545.11,
"r_y2": 320.35,
"r_x3": 331.05,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 341.21,
"r_x1": 545.12,
"r_y1": 341.21,
"r_x2": 545.12,
"r_y2": 332.31,
"r_x3": 308.86,
"r_y3": 332.31,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 353.17,
"r_x1": 545.12,
"r_y1": 353.17,
"r_x2": 545.12,
"r_y2": 344.26,
"r_x3": 308.86,
"r_y3": 344.26,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 365.12,
"r_x1": 545.12,
"r_y1": 365.12,
"r_x2": 545.12,
"r_y2": 356.22,
"r_x3": 308.86,
"r_y3": 356.22,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 377.08,
"r_x1": 545.12,
"r_y1": 377.08,
"r_x2": 545.12,
"r_y2": 368.17,
"r_x3": 308.86,
"r_y3": 368.17,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 389.03,
"r_x1": 545.11,
"r_y1": 389.03,
"r_x2": 545.11,
"r_y2": 380.13,
"r_x3": 308.86,
"r_y3": 380.13,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.99,
"r_x1": 545.12,
"r_y1": 400.99,
"r_x2": 545.12,
"r_y2": 392.08,
"r_x3": 308.86,
"r_y3": 392.08,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.94,
"r_x1": 545.12,
"r_y1": 412.94,
"r_x2": 545.12,
"r_y2": 404.04,
"r_x3": 308.86,
"r_y3": 404.04,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.9,
"r_x1": 545.11,
"r_y1": 424.9,
"r_x2": 545.11,
"r_y2": 415.99,
"r_x3": 308.86,
"r_y3": 415.99,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.85,
"r_x1": 545.12,
"r_y1": 436.85,
"r_x2": 545.12,
"r_y2": 427.95,
"r_x3": 308.86,
"r_y3": 427.95,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.81,
"r_x1": 345.94,
"r_y1": 448.81,
"r_x2": 345.94,
"r_y2": 439.9,
"r_x3": 308.86,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 461.52,
"r_x1": 328.3,
"r_y1": 461.52,
"r_x2": 328.3,
"r_y2": 452.62,
"r_x3": 320.82,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.52,
"r_x1": 485.76,
"r_y1": 461.52,
"r_x2": 485.76,
"r_y2": 452.62,
"r_x3": 330.8,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.07,
"r_y0": 461.29,
"r_x1": 511.86,
"r_y1": 461.29,
"r_x2": 511.86,
"r_y2": 452.71,
"r_x3": 488.07,
"r_y3": 452.71,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.86,
"r_y0": 461.52,
"r_x1": 545.11,
"r_y1": 461.52,
"r_x2": 545.11,
"r_y2": 452.62,
"r_x3": 511.86,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 473.48,
"r_x1": 545.12,
"r_y1": 473.48,
"r_x2": 545.12,
"r_y2": 464.57,
"r_x3": 308.86,
"r_y3": 464.57,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 485.43,
"r_x1": 545.12,
"r_y1": 485.43,
"r_x2": 545.12,
"r_y2": 476.53,
"r_x3": 308.86,
"r_y3": 476.53,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.39,
"r_x1": 379.15,
"r_y1": 497.39,
"r_x2": 379.15,
"r_y2": 488.48,
"r_x3": 308.86,
"r_y3": 488.48,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 510.1,
"r_x1": 328.66,
"r_y1": 510.1,
"r_x2": 328.66,
"r_y2": 501.2,
"r_x3": 320.82,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.28,
"r_y0": 510.1,
"r_x1": 545.11,
"r_y1": 510.1,
"r_x2": 545.11,
"r_y2": 501.2,
"r_x3": 331.28,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 522.06,
"r_x1": 545.12,
"r_y1": 522.06,
"r_x2": 545.12,
"r_y2": 513.15,
"r_x3": 308.86,
"r_y3": 513.15,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 534.01,
"r_x1": 384.3,
"r_y1": 534.01,
"r_x2": 384.3,
"r_y2": 525.11,
"r_x3": 308.86,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.25,
"r_y0": 534.01,
"r_x1": 545.12,
"r_y1": 534.01,
"r_x2": 545.12,
"r_y2": 525.11,
"r_x3": 391.25,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.97,
"r_x1": 496.16,
"r_y1": 545.97,
"r_x2": 496.16,
"r_y2": 537.06,
"r_x3": 308.86,
"r_y3": 537.06,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 558.68,
"r_x1": 328.29,
"r_y1": 558.68,
"r_x2": 328.29,
"r_y2": 549.78,
"r_x3": 320.82,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.68,
"r_x1": 545.11,
"r_y1": 558.68,
"r_x2": 545.11,
"r_y2": 549.78,
"r_x3": 335.4,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 570.64,
"r_x1": 545.12,
"r_y1": 570.64,
"r_x2": 545.12,
"r_y2": 561.73,
"r_x3": 308.86,
"r_y3": 561.73,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 582.59,
"r_x1": 545.12,
"r_y1": 582.59,
"r_x2": 545.12,
"r_y2": 573.69,
"r_x3": 308.86,
"r_y3": 573.69,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 594.55,
"r_x1": 545.12,
"r_y1": 594.55,
"r_x2": 545.12,
"r_y2": 585.64,
"r_x3": 308.86,
"r_y3": 585.64,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 606.5,
"r_x1": 341.23,
"r_y1": 606.5,
"r_x2": 341.23,
"r_y2": 597.6,
"r_x3": 308.86,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 633.04,
"r_x1": 316.77,
"r_y1": 633.04,
"r_x2": 316.77,
"r_y2": 622.29,
"r_x3": 308.86,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.31,
"r_y0": 633.04,
"r_x1": 545.11,
"r_y1": 633.04,
"r_x2": 545.11,
"r_y2": 622.29,
"r_x3": 327.31,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 646.99,
"r_x1": 357.34,
"r_y1": 646.99,
"r_x2": 357.34,
"r_y2": 636.24,
"r_x3": 326.8,
"r_y3": 636.24,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 666.33,
"r_x1": 545.11,
"r_y1": 666.33,
"r_x2": 545.11,
"r_y2": 657.42,
"r_x3": 320.82,
"r_y3": 657.42,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 678.28,
"r_x1": 545.12,
"r_y1": 678.28,
"r_x2": 545.12,
"r_y2": 669.38,
"r_x3": 308.86,
"r_y3": 669.38,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 690.24,
"r_x1": 545.12,
"r_y1": 690.24,
"r_x2": 545.12,
"r_y2": 681.33,
"r_x3": 308.86,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 702.19,
"r_x1": 545.12,
"r_y1": 702.19,
"r_x2": 545.12,
"r_y2": 693.29,
"r_x3": 308.86,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 714.15,
"r_x1": 371.43,
"r_y1": 714.15,
"r_x2": 371.43,
"r_y2": 705.24,
"r_x3": 308.86,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.84,
"t": 110.57,
"r": 465.38,
"b": 135.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.84,
"r_y0": 121.32,
"r_x1": 465.38,
"r_y1": 121.32,
"r_x2": 465.38,
"r_y2": 110.57,
"r_x3": 132.84,
"r_y3": 110.57,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.18,
"r_y0": 135.53,
"r_x1": 375.04,
"r_y1": 135.53,
"r_x2": 375.04,
"r_y2": 122.26,
"r_x3": 220.18,
"r_y3": 122.26,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 161.16,
"r": 175.96,
"b": 171.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 171.91,
"r_x1": 57.09,
"r_y1": 171.91,
"r_x2": 57.09,
"r_y2": 161.16,
"r_x3": 50.11,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.39,
"r_y0": 171.91,
"r_x1": 175.96,
"r_y1": 171.91,
"r_x2": 175.96,
"r_y2": 161.16,
"r_x3": 66.39,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 180.98,
"r": 150.36,
"b": 190.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 190.83,
"r_x1": 64.21,
"r_y1": 190.83,
"r_x2": 64.21,
"r_y2": 180.98,
"r_x3": 50.11,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.61,
"r_y0": 190.83,
"r_x1": 150.36,
"r_y1": 190.83,
"r_x2": 150.36,
"r_y2": 180.98,
"r_x3": 73.61,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 199.92,
"r": 286.37,
"b": 388.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 208.83,
"r_x1": 286.36,
"r_y1": 208.83,
"r_x2": 286.36,
"r_y2": 199.92,
"r_x3": 62.07,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 220.78,
"r_x1": 286.37,
"r_y1": 220.78,
"r_x2": 286.37,
"r_y2": 211.88,
"r_x3": 50.11,
"r_y3": 211.88,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 232.74,
"r_x1": 286.37,
"r_y1": 232.74,
"r_x2": 286.37,
"r_y2": 223.83,
"r_x3": 50.11,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 244.69,
"r_x1": 286.37,
"r_y1": 244.69,
"r_x2": 286.37,
"r_y2": 235.79,
"r_x3": 50.11,
"r_y3": 235.79,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 256.65,
"r_x1": 286.37,
"r_y1": 256.65,
"r_x2": 286.37,
"r_y2": 247.74,
"r_x3": 50.11,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 268.6,
"r_x1": 286.37,
"r_y1": 268.6,
"r_x2": 286.37,
"r_y2": 259.7,
"r_x3": 50.11,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 280.56,
"r_x1": 286.37,
"r_y1": 280.56,
"r_x2": 286.37,
"r_y2": 271.65,
"r_x3": 50.11,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 292.51,
"r_x1": 286.37,
"r_y1": 292.51,
"r_x2": 286.37,
"r_y2": 283.61,
"r_x3": 50.11,
"r_y3": 283.61,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 304.47,
"r_x1": 286.37,
"r_y1": 304.47,
"r_x2": 286.37,
"r_y2": 295.56,
"r_x3": 50.11,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 316.42,
"r_x1": 286.37,
"r_y1": 316.42,
"r_x2": 286.37,
"r_y2": 307.52,
"r_x3": 50.11,
"r_y3": 307.52,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 328.38,
"r_x1": 286.37,
"r_y1": 328.38,
"r_x2": 286.37,
"r_y2": 319.47,
"r_x3": 50.11,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 340.33,
"r_x1": 286.37,
"r_y1": 340.33,
"r_x2": 286.37,
"r_y2": 331.43,
"r_x3": 50.11,
"r_y3": 331.43,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 352.29,
"r_x1": 286.37,
"r_y1": 352.29,
"r_x2": 286.37,
"r_y2": 343.38,
"r_x3": 50.11,
"r_y3": 343.38,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 364.24,
"r_x1": 286.37,
"r_y1": 364.24,
"r_x2": 286.37,
"r_y2": 355.34,
"r_x3": 50.11,
"r_y3": 355.34,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 376.2,
"r_x1": 286.37,
"r_y1": 376.2,
"r_x2": 286.37,
"r_y2": 367.29,
"r_x3": 50.11,
"r_y3": 367.29,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 388.15,
"r_x1": 230.8,
"r_y1": 388.15,
"r_x2": 230.8,
"r_y2": 379.25,
"r_x3": 50.11,
"r_y3": 379.25,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 391.41,
"r": 286.37,
"b": 627.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 400.31,
"r_x1": 286.36,
"r_y1": 400.31,
"r_x2": 286.36,
"r_y2": 391.41,
"r_x3": 62.07,
"r_y3": 391.41,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 412.27,
"r_x1": 286.37,
"r_y1": 412.27,
"r_x2": 286.37,
"r_y2": 403.36,
"r_x3": 50.11,
"r_y3": 403.36,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 424.22,
"r_x1": 286.37,
"r_y1": 424.22,
"r_x2": 286.37,
"r_y2": 415.32,
"r_x3": 50.11,
"r_y3": 415.32,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 436.18,
"r_x1": 286.37,
"r_y1": 436.18,
"r_x2": 286.37,
"r_y2": 427.27,
"r_x3": 50.11,
"r_y3": 427.27,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.13,
"r_x1": 286.37,
"r_y1": 448.13,
"r_x2": 286.37,
"r_y2": 439.23,
"r_x3": 50.11,
"r_y3": 439.23,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.09,
"r_x1": 286.37,
"r_y1": 460.09,
"r_x2": 286.37,
"r_y2": 451.18,
"r_x3": 50.11,
"r_y3": 451.18,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.04,
"r_x1": 286.37,
"r_y1": 472.04,
"r_x2": 286.37,
"r_y2": 463.14,
"r_x3": 50.11,
"r_y3": 463.14,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.0,
"r_x1": 286.37,
"r_y1": 484.0,
"r_x2": 286.37,
"r_y2": 475.09,
"r_x3": 50.11,
"r_y3": 475.09,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 495.95,
"r_x1": 286.37,
"r_y1": 495.95,
"r_x2": 286.37,
"r_y2": 487.05,
"r_x3": 50.11,
"r_y3": 487.05,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 507.91,
"r_x1": 286.37,
"r_y1": 507.91,
"r_x2": 286.37,
"r_y2": 499.0,
"r_x3": 50.11,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 519.86,
"r_x1": 286.37,
"r_y1": 519.86,
"r_x2": 286.37,
"r_y2": 510.96,
"r_x3": 50.11,
"r_y3": 510.96,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.82,
"r_x1": 286.37,
"r_y1": 531.82,
"r_x2": 286.37,
"r_y2": 522.91,
"r_x3": 50.11,
"r_y3": 522.91,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.77,
"r_x1": 286.37,
"r_y1": 543.77,
"r_x2": 286.37,
"r_y2": 534.87,
"r_x3": 50.11,
"r_y3": 534.87,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.73,
"r_x1": 286.37,
"r_y1": 555.73,
"r_x2": 286.37,
"r_y2": 546.82,
"r_x3": 50.11,
"r_y3": 546.82,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.68,
"r_x1": 257.47,
"r_y1": 567.68,
"r_x2": 257.47,
"r_y2": 558.78,
"r_x3": 50.11,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.95,
"r_y0": 567.68,
"r_x1": 286.37,
"r_y1": 567.68,
"r_x2": 286.37,
"r_y2": 558.78,
"r_x3": 263.95,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.64,
"r_x1": 286.37,
"r_y1": 579.64,
"r_x2": 286.37,
"r_y2": 570.73,
"r_x3": 50.11,
"r_y3": 570.73,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.59,
"r_x1": 286.37,
"r_y1": 591.59,
"r_x2": 286.37,
"r_y2": 582.69,
"r_x3": 50.11,
"r_y3": 582.69,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.55,
"r_x1": 286.37,
"r_y1": 603.55,
"r_x2": 286.37,
"r_y2": 594.64,
"r_x3": 50.11,
"r_y3": 594.64,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.5,
"r_x1": 286.37,
"r_y1": 615.5,
"r_x2": 286.37,
"r_y2": 606.6,
"r_x3": 50.11,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.46,
"r_x1": 242.26,
"r_y1": 627.46,
"r_x2": 242.26,
"r_y2": 618.55,
"r_x3": 50.11,
"r_y3": 618.55,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 630.71,
"r": 286.36,
"b": 651.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.934,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 639.62,
"r_x1": 286.36,
"r_y1": 639.62,
"r_x2": 286.36,
"r_y2": 630.71,
"r_x3": 62.07,
"r_y3": 630.71,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 651.57,
"r_x1": 179.9,
"r_y1": 651.57,
"r_x2": 179.9,
"r_y2": 642.67,
"r_x3": 50.11,
"r_y3": 642.67,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 662.39,
"r": 153.61,
"b": 672.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 672.24,
"r_x1": 64.3,
"r_y1": 672.24,
"r_x2": 64.3,
"r_y2": 662.39,
"r_x3": 50.11,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.75,
"r_y0": 672.24,
"r_x1": 153.61,
"r_y1": 672.24,
"r_x2": 153.61,
"r_y2": 662.39,
"r_x3": 73.75,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 681.33,
"r": 286.37,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 690.24,
"r_x1": 286.36,
"r_y1": 690.24,
"r_x2": 286.36,
"r_y2": 681.33,
"r_x3": 62.07,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 702.19,
"r_x1": 286.37,
"r_y1": 702.19,
"r_x2": 286.37,
"r_y2": 693.29,
"r_x3": 50.11,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 714.15,
"r_x1": 84.14,
"r_y1": 714.15,
"r_x2": 84.14,
"r_y2": 705.24,
"r_x3": 50.11,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.24,
"r_y0": 714.15,
"r_x1": 286.37,
"r_y1": 714.15,
"r_x2": 286.37,
"r_y2": 705.24,
"r_x3": 91.24,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 162.66,
"r": 545.12,
"b": 207.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 171.56,
"r_x1": 545.12,
"r_y1": 171.56,
"r_x2": 545.12,
"r_y2": 162.66,
"r_x3": 308.86,
"r_y3": 162.66,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.52,
"r_x1": 545.12,
"r_y1": 183.52,
"r_x2": 545.12,
"r_y2": 174.61,
"r_x3": 308.86,
"r_y3": 174.61,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 195.47,
"r_x1": 545.12,
"r_y1": 195.47,
"r_x2": 545.12,
"r_y2": 186.57,
"r_x3": 308.86,
"r_y3": 186.57,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 207.43,
"r_x1": 484.07,
"r_y1": 207.43,
"r_x2": 484.07,
"r_y2": 198.52,
"r_x3": 308.86,
"r_y3": 198.52,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "text",
"bbox": {
"l": 308.86,
"t": 211.24,
"r": 545.12,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 220.14,
"r_x1": 545.12,
"r_y1": 220.14,
"r_x2": 545.12,
"r_y2": 211.24,
"r_x3": 320.82,
"r_y3": 211.24,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.1,
"r_x1": 448.09,
"r_y1": 232.1,
"r_x2": 448.09,
"r_y2": 223.19,
"r_x3": 308.86,
"r_y3": 223.19,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 235.91,
"r": 545.12,
"b": 316.54,
"coord_origin": "TOPLEFT"
},
"confidence": 0.964,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 244.81,
"r_x1": 328.29,
"r_y1": 244.81,
"r_x2": 328.29,
"r_y2": 235.91,
"r_x3": 320.82,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.38,
"r_y0": 244.81,
"r_x1": 545.11,
"r_y1": 244.81,
"r_x2": 545.11,
"r_y2": 235.91,
"r_x3": 335.38,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.77,
"r_x1": 545.12,
"r_y1": 256.77,
"r_x2": 545.12,
"r_y2": 247.86,
"r_x3": 308.86,
"r_y3": 247.86,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.72,
"r_x1": 545.12,
"r_y1": 268.72,
"r_x2": 545.12,
"r_y2": 259.82,
"r_x3": 308.86,
"r_y3": 259.82,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.68,
"r_x1": 393.38,
"r_y1": 280.68,
"r_x2": 393.38,
"r_y2": 271.77,
"r_x3": 308.86,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.12,
"r_y0": 280.68,
"r_x1": 545.12,
"r_y1": 280.68,
"r_x2": 545.12,
"r_y2": 271.77,
"r_x3": 400.12,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.63,
"r_x1": 545.12,
"r_y1": 292.63,
"r_x2": 545.12,
"r_y2": 283.73,
"r_x3": 308.86,
"r_y3": 283.73,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.59,
"r_x1": 545.12,
"r_y1": 304.59,
"r_x2": 545.12,
"r_y2": 295.68,
"r_x3": 308.86,
"r_y3": 295.68,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.54,
"r_x1": 425.69,
"r_y1": 316.54,
"r_x2": 425.69,
"r_y2": 307.64,
"r_x3": 308.86,
"r_y3": 307.64,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 320.35,
"r": 545.12,
"b": 448.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 329.26,
"r_x1": 328.49,
"r_y1": 329.26,
"r_x2": 328.49,
"r_y2": 320.35,
"r_x3": 320.82,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.05,
"r_y0": 329.26,
"r_x1": 545.11,
"r_y1": 329.26,
"r_x2": 545.11,
"r_y2": 320.35,
"r_x3": 331.05,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 341.21,
"r_x1": 545.12,
"r_y1": 341.21,
"r_x2": 545.12,
"r_y2": 332.31,
"r_x3": 308.86,
"r_y3": 332.31,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 353.17,
"r_x1": 545.12,
"r_y1": 353.17,
"r_x2": 545.12,
"r_y2": 344.26,
"r_x3": 308.86,
"r_y3": 344.26,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 365.12,
"r_x1": 545.12,
"r_y1": 365.12,
"r_x2": 545.12,
"r_y2": 356.22,
"r_x3": 308.86,
"r_y3": 356.22,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 377.08,
"r_x1": 545.12,
"r_y1": 377.08,
"r_x2": 545.12,
"r_y2": 368.17,
"r_x3": 308.86,
"r_y3": 368.17,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 389.03,
"r_x1": 545.11,
"r_y1": 389.03,
"r_x2": 545.11,
"r_y2": 380.13,
"r_x3": 308.86,
"r_y3": 380.13,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.99,
"r_x1": 545.12,
"r_y1": 400.99,
"r_x2": 545.12,
"r_y2": 392.08,
"r_x3": 308.86,
"r_y3": 392.08,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.94,
"r_x1": 545.12,
"r_y1": 412.94,
"r_x2": 545.12,
"r_y2": 404.04,
"r_x3": 308.86,
"r_y3": 404.04,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.9,
"r_x1": 545.11,
"r_y1": 424.9,
"r_x2": 545.11,
"r_y2": 415.99,
"r_x3": 308.86,
"r_y3": 415.99,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.85,
"r_x1": 545.12,
"r_y1": 436.85,
"r_x2": 545.12,
"r_y2": 427.95,
"r_x3": 308.86,
"r_y3": 427.95,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.81,
"r_x1": 345.94,
"r_y1": 448.81,
"r_x2": 345.94,
"r_y2": 439.9,
"r_x3": 308.86,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 452.62,
"r": 545.12,
"b": 497.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.957,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 461.52,
"r_x1": 328.3,
"r_y1": 461.52,
"r_x2": 328.3,
"r_y2": 452.62,
"r_x3": 320.82,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.52,
"r_x1": 485.76,
"r_y1": 461.52,
"r_x2": 485.76,
"r_y2": 452.62,
"r_x3": 330.8,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.07,
"r_y0": 461.29,
"r_x1": 511.86,
"r_y1": 461.29,
"r_x2": 511.86,
"r_y2": 452.71,
"r_x3": 488.07,
"r_y3": 452.71,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.86,
"r_y0": 461.52,
"r_x1": 545.11,
"r_y1": 461.52,
"r_x2": 545.11,
"r_y2": 452.62,
"r_x3": 511.86,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 473.48,
"r_x1": 545.12,
"r_y1": 473.48,
"r_x2": 545.12,
"r_y2": 464.57,
"r_x3": 308.86,
"r_y3": 464.57,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 485.43,
"r_x1": 545.12,
"r_y1": 485.43,
"r_x2": 545.12,
"r_y2": 476.53,
"r_x3": 308.86,
"r_y3": 476.53,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.39,
"r_x1": 379.15,
"r_y1": 497.39,
"r_x2": 379.15,
"r_y2": 488.48,
"r_x3": 308.86,
"r_y3": 488.48,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 501.2,
"r": 545.12,
"b": 545.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 510.1,
"r_x1": 328.66,
"r_y1": 510.1,
"r_x2": 328.66,
"r_y2": 501.2,
"r_x3": 320.82,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.28,
"r_y0": 510.1,
"r_x1": 545.11,
"r_y1": 510.1,
"r_x2": 545.11,
"r_y2": 501.2,
"r_x3": 331.28,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 522.06,
"r_x1": 545.12,
"r_y1": 522.06,
"r_x2": 545.12,
"r_y2": 513.15,
"r_x3": 308.86,
"r_y3": 513.15,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 534.01,
"r_x1": 384.3,
"r_y1": 534.01,
"r_x2": 384.3,
"r_y2": 525.11,
"r_x3": 308.86,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.25,
"r_y0": 534.01,
"r_x1": 545.12,
"r_y1": 534.01,
"r_x2": 545.12,
"r_y2": 525.11,
"r_x3": 391.25,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.97,
"r_x1": 496.16,
"r_y1": 545.97,
"r_x2": 496.16,
"r_y2": 537.06,
"r_x3": 308.86,
"r_y3": 537.06,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 549.78,
"r": 545.12,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 558.68,
"r_x1": 328.29,
"r_y1": 558.68,
"r_x2": 328.29,
"r_y2": 549.78,
"r_x3": 320.82,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.68,
"r_x1": 545.11,
"r_y1": 558.68,
"r_x2": 545.11,
"r_y2": 549.78,
"r_x3": 335.4,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 570.64,
"r_x1": 545.12,
"r_y1": 570.64,
"r_x2": 545.12,
"r_y2": 561.73,
"r_x3": 308.86,
"r_y3": 561.73,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 582.59,
"r_x1": 545.12,
"r_y1": 582.59,
"r_x2": 545.12,
"r_y2": 573.69,
"r_x3": 308.86,
"r_y3": 573.69,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 594.55,
"r_x1": 545.12,
"r_y1": 594.55,
"r_x2": 545.12,
"r_y2": 585.64,
"r_x3": 308.86,
"r_y3": 585.64,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 606.5,
"r_x1": 341.23,
"r_y1": 606.5,
"r_x2": 341.23,
"r_y2": 597.6,
"r_x3": 308.86,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 622.29,
"r": 545.11,
"b": 646.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 633.04,
"r_x1": 316.77,
"r_y1": 633.04,
"r_x2": 316.77,
"r_y2": 622.29,
"r_x3": 308.86,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.31,
"r_y0": 633.04,
"r_x1": 545.11,
"r_y1": 633.04,
"r_x2": 545.11,
"r_y2": 622.29,
"r_x3": 327.31,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 646.99,
"r_x1": 357.34,
"r_y1": 646.99,
"r_x2": 357.34,
"r_y2": 636.24,
"r_x3": 326.8,
"r_y3": 636.24,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 657.42,
"r": 545.12,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 666.33,
"r_x1": 545.11,
"r_y1": 666.33,
"r_x2": 545.11,
"r_y2": 657.42,
"r_x3": 320.82,
"r_y3": 657.42,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 678.28,
"r_x1": 545.12,
"r_y1": 678.28,
"r_x2": 545.12,
"r_y2": 669.38,
"r_x3": 308.86,
"r_y3": 669.38,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 690.24,
"r_x1": 545.12,
"r_y1": 690.24,
"r_x2": 545.12,
"r_y2": 681.33,
"r_x3": 308.86,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 702.19,
"r_x1": 545.12,
"r_y1": 702.19,
"r_x2": 545.12,
"r_y2": 693.29,
"r_x3": 308.86,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 714.15,
"r_x1": 371.43,
"r_y1": 714.15,
"r_x2": 371.43,
"r_y2": 705.24,
"r_x3": 308.86,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.899,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 18,
"page_no": 10,
"cluster": {
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.84,
"t": 110.57,
"r": 465.38,
"b": 135.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.84,
"r_y0": 121.32,
"r_x1": 465.38,
"r_y1": 121.32,
"r_x2": 465.38,
"r_y2": 110.57,
"r_x3": 132.84,
"r_y3": 110.57,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.18,
"r_y0": 135.53,
"r_x1": 375.04,
"r_y1": 135.53,
"r_x2": 375.04,
"r_y2": 122.26,
"r_x3": 220.18,
"r_y3": 122.26,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"
},
{
"label": "section_header",
"id": 13,
"page_no": 10,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 161.16,
"r": 175.96,
"b": 171.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 171.91,
"r_x1": 57.09,
"r_y1": 171.91,
"r_x2": 57.09,
"r_y2": 161.16,
"r_x3": 50.11,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.39,
"r_y0": 171.91,
"r_x1": 175.96,
"r_y1": 171.91,
"r_x2": 175.96,
"r_y2": 161.16,
"r_x3": 66.39,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Details on the datasets"
},
{
"label": "section_header",
"id": 11,
"page_no": 10,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 180.98,
"r": 150.36,
"b": 190.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 190.83,
"r_x1": 64.21,
"r_y1": 190.83,
"r_x2": 64.21,
"r_y2": 180.98,
"r_x3": 50.11,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.61,
"r_y0": 190.83,
"r_x1": 150.36,
"r_y1": 190.83,
"r_x2": 150.36,
"r_y2": 180.98,
"r_x3": 73.61,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.1. Data preparation"
},
{
"label": "text",
"id": 0,
"page_no": 10,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 199.92,
"r": 286.37,
"b": 388.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 208.83,
"r_x1": 286.36,
"r_y1": 208.83,
"r_x2": 286.36,
"r_y2": 199.92,
"r_x3": 62.07,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 220.78,
"r_x1": 286.37,
"r_y1": 220.78,
"r_x2": 286.37,
"r_y2": 211.88,
"r_x3": 50.11,
"r_y3": 211.88,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 232.74,
"r_x1": 286.37,
"r_y1": 232.74,
"r_x2": 286.37,
"r_y2": 223.83,
"r_x3": 50.11,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 244.69,
"r_x1": 286.37,
"r_y1": 244.69,
"r_x2": 286.37,
"r_y2": 235.79,
"r_x3": 50.11,
"r_y3": 235.79,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 256.65,
"r_x1": 286.37,
"r_y1": 256.65,
"r_x2": 286.37,
"r_y2": 247.74,
"r_x3": 50.11,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 268.6,
"r_x1": 286.37,
"r_y1": 268.6,
"r_x2": 286.37,
"r_y2": 259.7,
"r_x3": 50.11,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 280.56,
"r_x1": 286.37,
"r_y1": 280.56,
"r_x2": 286.37,
"r_y2": 271.65,
"r_x3": 50.11,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 292.51,
"r_x1": 286.37,
"r_y1": 292.51,
"r_x2": 286.37,
"r_y2": 283.61,
"r_x3": 50.11,
"r_y3": 283.61,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 304.47,
"r_x1": 286.37,
"r_y1": 304.47,
"r_x2": 286.37,
"r_y2": 295.56,
"r_x3": 50.11,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 316.42,
"r_x1": 286.37,
"r_y1": 316.42,
"r_x2": 286.37,
"r_y2": 307.52,
"r_x3": 50.11,
"r_y3": 307.52,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 328.38,
"r_x1": 286.37,
"r_y1": 328.38,
"r_x2": 286.37,
"r_y2": 319.47,
"r_x3": 50.11,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 340.33,
"r_x1": 286.37,
"r_y1": 340.33,
"r_x2": 286.37,
"r_y2": 331.43,
"r_x3": 50.11,
"r_y3": 331.43,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 352.29,
"r_x1": 286.37,
"r_y1": 352.29,
"r_x2": 286.37,
"r_y2": 343.38,
"r_x3": 50.11,
"r_y3": 343.38,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 364.24,
"r_x1": 286.37,
"r_y1": 364.24,
"r_x2": 286.37,
"r_y2": 355.34,
"r_x3": 50.11,
"r_y3": 355.34,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 376.2,
"r_x1": 286.37,
"r_y1": 376.2,
"r_x2": 286.37,
"r_y2": 367.29,
"r_x3": 50.11,
"r_y3": 367.29,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 388.15,
"r_x1": 230.8,
"r_y1": 388.15,
"r_x2": 230.8,
"r_y2": 379.25,
"r_x3": 50.11,
"r_y3": 379.25,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length."
},
{
"label": "text",
"id": 2,
"page_no": 10,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 391.41,
"r": 286.37,
"b": 627.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 400.31,
"r_x1": 286.36,
"r_y1": 400.31,
"r_x2": 286.36,
"r_y2": 391.41,
"r_x3": 62.07,
"r_y3": 391.41,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 412.27,
"r_x1": 286.37,
"r_y1": 412.27,
"r_x2": 286.37,
"r_y2": 403.36,
"r_x3": 50.11,
"r_y3": 403.36,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 424.22,
"r_x1": 286.37,
"r_y1": 424.22,
"r_x2": 286.37,
"r_y2": 415.32,
"r_x3": 50.11,
"r_y3": 415.32,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 436.18,
"r_x1": 286.37,
"r_y1": 436.18,
"r_x2": 286.37,
"r_y2": 427.27,
"r_x3": 50.11,
"r_y3": 427.27,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.13,
"r_x1": 286.37,
"r_y1": 448.13,
"r_x2": 286.37,
"r_y2": 439.23,
"r_x3": 50.11,
"r_y3": 439.23,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.09,
"r_x1": 286.37,
"r_y1": 460.09,
"r_x2": 286.37,
"r_y2": 451.18,
"r_x3": 50.11,
"r_y3": 451.18,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.04,
"r_x1": 286.37,
"r_y1": 472.04,
"r_x2": 286.37,
"r_y2": 463.14,
"r_x3": 50.11,
"r_y3": 463.14,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.0,
"r_x1": 286.37,
"r_y1": 484.0,
"r_x2": 286.37,
"r_y2": 475.09,
"r_x3": 50.11,
"r_y3": 475.09,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 495.95,
"r_x1": 286.37,
"r_y1": 495.95,
"r_x2": 286.37,
"r_y2": 487.05,
"r_x3": 50.11,
"r_y3": 487.05,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 507.91,
"r_x1": 286.37,
"r_y1": 507.91,
"r_x2": 286.37,
"r_y2": 499.0,
"r_x3": 50.11,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 519.86,
"r_x1": 286.37,
"r_y1": 519.86,
"r_x2": 286.37,
"r_y2": 510.96,
"r_x3": 50.11,
"r_y3": 510.96,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.82,
"r_x1": 286.37,
"r_y1": 531.82,
"r_x2": 286.37,
"r_y2": 522.91,
"r_x3": 50.11,
"r_y3": 522.91,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.77,
"r_x1": 286.37,
"r_y1": 543.77,
"r_x2": 286.37,
"r_y2": 534.87,
"r_x3": 50.11,
"r_y3": 534.87,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.73,
"r_x1": 286.37,
"r_y1": 555.73,
"r_x2": 286.37,
"r_y2": 546.82,
"r_x3": 50.11,
"r_y3": 546.82,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.68,
"r_x1": 257.47,
"r_y1": 567.68,
"r_x2": 257.47,
"r_y2": 558.78,
"r_x3": 50.11,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.95,
"r_y0": 567.68,
"r_x1": 286.37,
"r_y1": 567.68,
"r_x2": 286.37,
"r_y2": 558.78,
"r_x3": 263.95,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.64,
"r_x1": 286.37,
"r_y1": 579.64,
"r_x2": 286.37,
"r_y2": 570.73,
"r_x3": 50.11,
"r_y3": 570.73,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.59,
"r_x1": 286.37,
"r_y1": 591.59,
"r_x2": 286.37,
"r_y2": 582.69,
"r_x3": 50.11,
"r_y3": 582.69,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.55,
"r_x1": 286.37,
"r_y1": 603.55,
"r_x2": 286.37,
"r_y2": 594.64,
"r_x3": 50.11,
"r_y3": 594.64,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.5,
"r_x1": 286.37,
"r_y1": 615.5,
"r_x2": 286.37,
"r_y2": 606.6,
"r_x3": 50.11,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.46,
"r_x1": 242.26,
"r_y1": 627.46,
"r_x2": 242.26,
"r_y2": 618.55,
"r_x3": 50.11,
"r_y3": 618.55,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 14,
"page_no": 10,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 630.71,
"r": 286.36,
"b": 651.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.934,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 639.62,
"r_x1": 286.36,
"r_y1": 639.62,
"r_x2": 286.36,
"r_y2": 630.71,
"r_x3": 62.07,
"r_y3": 630.71,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 651.57,
"r_x1": 179.9,
"r_y1": 651.57,
"r_x2": 179.9,
"r_y2": 642.67,
"r_x3": 50.11,
"r_y3": 642.67,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."
},
{
"label": "section_header",
"id": 12,
"page_no": 10,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 662.39,
"r": 153.61,
"b": 672.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 672.24,
"r_x1": 64.3,
"r_y1": 672.24,
"r_x2": 64.3,
"r_y2": 662.39,
"r_x3": 50.11,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.75,
"r_y0": 672.24,
"r_x1": 153.61,
"r_y1": 672.24,
"r_x2": 153.61,
"r_y2": 662.39,
"r_x3": 73.75,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.2. Synthetic datasets"
},
{
"label": "text",
"id": 3,
"page_no": 10,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 681.33,
"r": 286.37,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 690.24,
"r_x1": 286.36,
"r_y1": 690.24,
"r_x2": 286.36,
"r_y2": 681.33,
"r_x3": 62.07,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 702.19,
"r_x1": 286.37,
"r_y1": 702.19,
"r_x2": 286.37,
"r_y2": 693.29,
"r_x3": 50.11,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 714.15,
"r_x1": 84.14,
"r_y1": 714.15,
"r_x2": 84.14,
"r_y2": 705.24,
"r_x3": 50.11,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.24,
"r_y0": 714.15,
"r_x1": 286.37,
"r_y1": 714.15,
"r_x2": 286.37,
"r_y2": 705.24,
"r_x3": 91.24,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"
},
{
"label": "text",
"id": 8,
"page_no": 10,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 162.66,
"r": 545.12,
"b": 207.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 171.56,
"r_x1": 545.12,
"r_y1": 171.56,
"r_x2": 545.12,
"r_y2": 162.66,
"r_x3": 308.86,
"r_y3": 162.66,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.52,
"r_x1": 545.12,
"r_y1": 183.52,
"r_x2": 545.12,
"r_y2": 174.61,
"r_x3": 308.86,
"r_y3": 174.61,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 195.47,
"r_x1": 545.12,
"r_y1": 195.47,
"r_x2": 545.12,
"r_y2": 186.57,
"r_x3": 308.86,
"r_y3": 186.57,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 207.43,
"r_x1": 484.07,
"r_y1": 207.43,
"r_x2": 484.07,
"r_y2": 198.52,
"r_x3": 308.86,
"r_y3": 198.52,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."
},
{
"label": "text",
"id": 15,
"page_no": 10,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 308.86,
"t": 211.24,
"r": 545.12,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 220.14,
"r_x1": 545.12,
"r_y1": 220.14,
"r_x2": 545.12,
"r_y2": 211.24,
"r_x3": 320.82,
"r_y3": 211.24,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.1,
"r_x1": 448.09,
"r_y1": 232.1,
"r_x2": 448.09,
"r_y2": 223.19,
"r_x3": 308.86,
"r_y3": 223.19,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The process of generating a synthetic dataset can be decomposed into the following steps:"
},
{
"label": "list_item",
"id": 7,
"page_no": 10,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 235.91,
"r": 545.12,
"b": 316.54,
"coord_origin": "TOPLEFT"
},
"confidence": 0.964,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 244.81,
"r_x1": 328.29,
"r_y1": 244.81,
"r_x2": 328.29,
"r_y2": 235.91,
"r_x3": 320.82,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.38,
"r_y0": 244.81,
"r_x1": 545.11,
"r_y1": 244.81,
"r_x2": 545.11,
"r_y2": 235.91,
"r_x3": 335.38,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.77,
"r_x1": 545.12,
"r_y1": 256.77,
"r_x2": 545.12,
"r_y2": 247.86,
"r_x3": 308.86,
"r_y3": 247.86,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.72,
"r_x1": 545.12,
"r_y1": 268.72,
"r_x2": 545.12,
"r_y2": 259.82,
"r_x3": 308.86,
"r_y3": 259.82,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.68,
"r_x1": 393.38,
"r_y1": 280.68,
"r_x2": 393.38,
"r_y2": 271.77,
"r_x3": 308.86,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.12,
"r_y0": 280.68,
"r_x1": 545.12,
"r_y1": 280.68,
"r_x2": 545.12,
"r_y2": 271.77,
"r_x3": 400.12,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.63,
"r_x1": 545.12,
"r_y1": 292.63,
"r_x2": 545.12,
"r_y2": 283.73,
"r_x3": 308.86,
"r_y3": 283.73,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.59,
"r_x1": 545.12,
"r_y1": 304.59,
"r_x2": 545.12,
"r_y2": 295.68,
"r_x3": 308.86,
"r_y3": 295.68,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.54,
"r_x1": 425.69,
"r_y1": 316.54,
"r_x2": 425.69,
"r_y2": 307.64,
"r_x3": 308.86,
"r_y3": 307.64,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."
},
{
"label": "list_item",
"id": 6,
"page_no": 10,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 320.35,
"r": 545.12,
"b": 448.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 329.26,
"r_x1": 328.49,
"r_y1": 329.26,
"r_x2": 328.49,
"r_y2": 320.35,
"r_x3": 320.82,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.05,
"r_y0": 329.26,
"r_x1": 545.11,
"r_y1": 329.26,
"r_x2": 545.11,
"r_y2": 320.35,
"r_x3": 331.05,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 341.21,
"r_x1": 545.12,
"r_y1": 341.21,
"r_x2": 545.12,
"r_y2": 332.31,
"r_x3": 308.86,
"r_y3": 332.31,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 353.17,
"r_x1": 545.12,
"r_y1": 353.17,
"r_x2": 545.12,
"r_y2": 344.26,
"r_x3": 308.86,
"r_y3": 344.26,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 365.12,
"r_x1": 545.12,
"r_y1": 365.12,
"r_x2": 545.12,
"r_y2": 356.22,
"r_x3": 308.86,
"r_y3": 356.22,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 377.08,
"r_x1": 545.12,
"r_y1": 377.08,
"r_x2": 545.12,
"r_y2": 368.17,
"r_x3": 308.86,
"r_y3": 368.17,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 389.03,
"r_x1": 545.11,
"r_y1": 389.03,
"r_x2": 545.11,
"r_y2": 380.13,
"r_x3": 308.86,
"r_y3": 380.13,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.99,
"r_x1": 545.12,
"r_y1": 400.99,
"r_x2": 545.12,
"r_y2": 392.08,
"r_x3": 308.86,
"r_y3": 392.08,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.94,
"r_x1": 545.12,
"r_y1": 412.94,
"r_x2": 545.12,
"r_y2": 404.04,
"r_x3": 308.86,
"r_y3": 404.04,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.9,
"r_x1": 545.11,
"r_y1": 424.9,
"r_x2": 545.11,
"r_y2": 415.99,
"r_x3": 308.86,
"r_y3": 415.99,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.85,
"r_x1": 545.12,
"r_y1": 436.85,
"r_x2": 545.12,
"r_y2": 427.95,
"r_x3": 308.86,
"r_y3": 427.95,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.81,
"r_x1": 345.94,
"r_y1": 448.81,
"r_x2": 345.94,
"r_y2": 439.9,
"r_x3": 308.86,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."
},
{
"label": "list_item",
"id": 9,
"page_no": 10,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 452.62,
"r": 545.12,
"b": 497.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.957,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 461.52,
"r_x1": 328.3,
"r_y1": 461.52,
"r_x2": 328.3,
"r_y2": 452.62,
"r_x3": 320.82,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.52,
"r_x1": 485.76,
"r_y1": 461.52,
"r_x2": 485.76,
"r_y2": 452.62,
"r_x3": 330.8,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.07,
"r_y0": 461.29,
"r_x1": 511.86,
"r_y1": 461.29,
"r_x2": 511.86,
"r_y2": 452.71,
"r_x3": 488.07,
"r_y3": 452.71,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.86,
"r_y0": 461.52,
"r_x1": 545.11,
"r_y1": 461.52,
"r_x2": 545.11,
"r_y2": 452.62,
"r_x3": 511.86,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 473.48,
"r_x1": 545.12,
"r_y1": 473.48,
"r_x2": 545.12,
"r_y2": 464.57,
"r_x3": 308.86,
"r_y3": 464.57,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 485.43,
"r_x1": 545.12,
"r_y1": 485.43,
"r_x2": 545.12,
"r_y2": 476.53,
"r_x3": 308.86,
"r_y3": 476.53,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.39,
"r_x1": 379.15,
"r_y1": 497.39,
"r_x2": 379.15,
"r_y2": 488.48,
"r_x3": 308.86,
"r_y3": 488.48,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."
},
{
"label": "list_item",
"id": 5,
"page_no": 10,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 501.2,
"r": 545.12,
"b": 545.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 510.1,
"r_x1": 328.66,
"r_y1": 510.1,
"r_x2": 328.66,
"r_y2": 501.2,
"r_x3": 320.82,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.28,
"r_y0": 510.1,
"r_x1": 545.11,
"r_y1": 510.1,
"r_x2": 545.11,
"r_y2": 501.2,
"r_x3": 331.28,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 522.06,
"r_x1": 545.12,
"r_y1": 522.06,
"r_x2": 545.12,
"r_y2": 513.15,
"r_x3": 308.86,
"r_y3": 513.15,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 534.01,
"r_x1": 384.3,
"r_y1": 534.01,
"r_x2": 384.3,
"r_y2": 525.11,
"r_x3": 308.86,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.25,
"r_y0": 534.01,
"r_x1": 545.12,
"r_y1": 534.01,
"r_x2": 545.12,
"r_y2": 525.11,
"r_x3": 391.25,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.97,
"r_x1": 496.16,
"r_y1": 545.97,
"r_x2": 496.16,
"r_y2": 537.06,
"r_x3": 308.86,
"r_y3": 537.06,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."
},
{
"label": "list_item",
"id": 4,
"page_no": 10,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 549.78,
"r": 545.12,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 558.68,
"r_x1": 328.29,
"r_y1": 558.68,
"r_x2": 328.29,
"r_y2": 549.78,
"r_x3": 320.82,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.68,
"r_x1": 545.11,
"r_y1": 558.68,
"r_x2": 545.11,
"r_y2": 549.78,
"r_x3": 335.4,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 570.64,
"r_x1": 545.12,
"r_y1": 570.64,
"r_x2": 545.12,
"r_y2": 561.73,
"r_x3": 308.86,
"r_y3": 561.73,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 582.59,
"r_x1": 545.12,
"r_y1": 582.59,
"r_x2": 545.12,
"r_y2": 573.69,
"r_x3": 308.86,
"r_y3": 573.69,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 594.55,
"r_x1": 545.12,
"r_y1": 594.55,
"r_x2": 545.12,
"r_y2": 585.64,
"r_x3": 308.86,
"r_y3": 585.64,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 606.5,
"r_x1": 341.23,
"r_y1": 606.5,
"r_x2": 341.23,
"r_y2": 597.6,
"r_x3": 308.86,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."
},
{
"label": "section_header",
"id": 10,
"page_no": 10,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 622.29,
"r": 545.11,
"b": 646.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 633.04,
"r_x1": 316.77,
"r_y1": 633.04,
"r_x2": 316.77,
"r_y2": 622.29,
"r_x3": 308.86,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.31,
"r_y0": 633.04,
"r_x1": 545.11,
"r_y1": 633.04,
"r_x2": 545.11,
"r_y2": 622.29,
"r_x3": 327.31,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 646.99,
"r_x1": 357.34,
"r_y1": 646.99,
"r_x2": 357.34,
"r_y2": 636.24,
"r_x3": 326.8,
"r_y3": 636.24,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Prediction post-processing for PDF documents"
},
{
"label": "text",
"id": 1,
"page_no": 10,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 657.42,
"r": 545.12,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 666.33,
"r_x1": 545.11,
"r_y1": 666.33,
"r_x2": 545.11,
"r_y2": 657.42,
"r_x3": 320.82,
"r_y3": 657.42,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 678.28,
"r_x1": 545.12,
"r_y1": 678.28,
"r_x2": 545.12,
"r_y2": 669.38,
"r_x3": 308.86,
"r_y3": 669.38,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 690.24,
"r_x1": 545.12,
"r_y1": 690.24,
"r_x2": 545.12,
"r_y2": 681.33,
"r_x3": 308.86,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 702.19,
"r_x1": 545.12,
"r_y1": 702.19,
"r_x2": 545.12,
"r_y2": 693.29,
"r_x3": 308.86,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 714.15,
"r_x1": 371.43,
"r_y1": 714.15,
"r_x2": 371.43,
"r_y2": 705.24,
"r_x3": 308.86,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"
},
{
"label": "page_footer",
"id": 16,
"page_no": 10,
"cluster": {
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.899,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "11"
}
],
"body": [
{
"label": "section_header",
"id": 18,
"page_no": 10,
"cluster": {
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.84,
"t": 110.57,
"r": 465.38,
"b": 135.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.84,
"r_y0": 121.32,
"r_x1": 465.38,
"r_y1": 121.32,
"r_x2": 465.38,
"r_y2": 110.57,
"r_x3": 132.84,
"r_y3": 110.57,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.18,
"r_y0": 135.53,
"r_x1": 375.04,
"r_y1": 135.53,
"r_x2": 375.04,
"r_y2": 122.26,
"r_x3": 220.18,
"r_y3": 122.26,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"
},
{
"label": "section_header",
"id": 13,
"page_no": 10,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 161.16,
"r": 175.96,
"b": 171.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 171.91,
"r_x1": 57.09,
"r_y1": 171.91,
"r_x2": 57.09,
"r_y2": 161.16,
"r_x3": 50.11,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.39,
"r_y0": 171.91,
"r_x1": 175.96,
"r_y1": 171.91,
"r_x2": 175.96,
"r_y2": 161.16,
"r_x3": 66.39,
"r_y3": 161.16,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Details on the datasets"
},
{
"label": "section_header",
"id": 11,
"page_no": 10,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 180.98,
"r": 150.36,
"b": 190.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.954,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 190.83,
"r_x1": 64.21,
"r_y1": 190.83,
"r_x2": 64.21,
"r_y2": 180.98,
"r_x3": 50.11,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.61,
"r_y0": 190.83,
"r_x1": 150.36,
"r_y1": 190.83,
"r_x2": 150.36,
"r_y2": 180.98,
"r_x3": 73.61,
"r_y3": 180.98,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.1. Data preparation"
},
{
"label": "text",
"id": 0,
"page_no": 10,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 199.92,
"r": 286.37,
"b": 388.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.986,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 208.83,
"r_x1": 286.36,
"r_y1": 208.83,
"r_x2": 286.36,
"r_y2": 199.92,
"r_x3": 62.07,
"r_y3": 199.92,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 220.78,
"r_x1": 286.37,
"r_y1": 220.78,
"r_x2": 286.37,
"r_y2": 211.88,
"r_x3": 50.11,
"r_y3": 211.88,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 232.74,
"r_x1": 286.37,
"r_y1": 232.74,
"r_x2": 286.37,
"r_y2": 223.83,
"r_x3": 50.11,
"r_y3": 223.83,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 244.69,
"r_x1": 286.37,
"r_y1": 244.69,
"r_x2": 286.37,
"r_y2": 235.79,
"r_x3": 50.11,
"r_y3": 235.79,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 256.65,
"r_x1": 286.37,
"r_y1": 256.65,
"r_x2": 286.37,
"r_y2": 247.74,
"r_x3": 50.11,
"r_y3": 247.74,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 268.6,
"r_x1": 286.37,
"r_y1": 268.6,
"r_x2": 286.37,
"r_y2": 259.7,
"r_x3": 50.11,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 280.56,
"r_x1": 286.37,
"r_y1": 280.56,
"r_x2": 286.37,
"r_y2": 271.65,
"r_x3": 50.11,
"r_y3": 271.65,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 292.51,
"r_x1": 286.37,
"r_y1": 292.51,
"r_x2": 286.37,
"r_y2": 283.61,
"r_x3": 50.11,
"r_y3": 283.61,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 304.47,
"r_x1": 286.37,
"r_y1": 304.47,
"r_x2": 286.37,
"r_y2": 295.56,
"r_x3": 50.11,
"r_y3": 295.56,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 316.42,
"r_x1": 286.37,
"r_y1": 316.42,
"r_x2": 286.37,
"r_y2": 307.52,
"r_x3": 50.11,
"r_y3": 307.52,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 328.38,
"r_x1": 286.37,
"r_y1": 328.38,
"r_x2": 286.37,
"r_y2": 319.47,
"r_x3": 50.11,
"r_y3": 319.47,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 340.33,
"r_x1": 286.37,
"r_y1": 340.33,
"r_x2": 286.37,
"r_y2": 331.43,
"r_x3": 50.11,
"r_y3": 331.43,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 352.29,
"r_x1": 286.37,
"r_y1": 352.29,
"r_x2": 286.37,
"r_y2": 343.38,
"r_x3": 50.11,
"r_y3": 343.38,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 364.24,
"r_x1": 286.37,
"r_y1": 364.24,
"r_x2": 286.37,
"r_y2": 355.34,
"r_x3": 50.11,
"r_y3": 355.34,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 376.2,
"r_x1": 286.37,
"r_y1": 376.2,
"r_x2": 286.37,
"r_y2": 367.29,
"r_x3": 50.11,
"r_y3": 367.29,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 388.15,
"r_x1": 230.8,
"r_y1": 388.15,
"r_x2": 230.8,
"r_y2": 379.25,
"r_x3": 50.11,
"r_y3": 379.25,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length."
},
{
"label": "text",
"id": 2,
"page_no": 10,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.11,
"t": 391.41,
"r": 286.37,
"b": 627.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 400.31,
"r_x1": 286.36,
"r_y1": 400.31,
"r_x2": 286.36,
"r_y2": 391.41,
"r_x3": 62.07,
"r_y3": 391.41,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 412.27,
"r_x1": 286.37,
"r_y1": 412.27,
"r_x2": 286.37,
"r_y2": 403.36,
"r_x3": 50.11,
"r_y3": 403.36,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 424.22,
"r_x1": 286.37,
"r_y1": 424.22,
"r_x2": 286.37,
"r_y2": 415.32,
"r_x3": 50.11,
"r_y3": 415.32,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 436.18,
"r_x1": 286.37,
"r_y1": 436.18,
"r_x2": 286.37,
"r_y2": 427.27,
"r_x3": 50.11,
"r_y3": 427.27,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 448.13,
"r_x1": 286.37,
"r_y1": 448.13,
"r_x2": 286.37,
"r_y2": 439.23,
"r_x3": 50.11,
"r_y3": 439.23,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 460.09,
"r_x1": 286.37,
"r_y1": 460.09,
"r_x2": 286.37,
"r_y2": 451.18,
"r_x3": 50.11,
"r_y3": 451.18,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 472.04,
"r_x1": 286.37,
"r_y1": 472.04,
"r_x2": 286.37,
"r_y2": 463.14,
"r_x3": 50.11,
"r_y3": 463.14,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 484.0,
"r_x1": 286.37,
"r_y1": 484.0,
"r_x2": 286.37,
"r_y2": 475.09,
"r_x3": 50.11,
"r_y3": 475.09,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 495.95,
"r_x1": 286.37,
"r_y1": 495.95,
"r_x2": 286.37,
"r_y2": 487.05,
"r_x3": 50.11,
"r_y3": 487.05,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 507.91,
"r_x1": 286.37,
"r_y1": 507.91,
"r_x2": 286.37,
"r_y2": 499.0,
"r_x3": 50.11,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 519.86,
"r_x1": 286.37,
"r_y1": 519.86,
"r_x2": 286.37,
"r_y2": 510.96,
"r_x3": 50.11,
"r_y3": 510.96,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 531.82,
"r_x1": 286.37,
"r_y1": 531.82,
"r_x2": 286.37,
"r_y2": 522.91,
"r_x3": 50.11,
"r_y3": 522.91,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 543.77,
"r_x1": 286.37,
"r_y1": 543.77,
"r_x2": 286.37,
"r_y2": 534.87,
"r_x3": 50.11,
"r_y3": 534.87,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 555.73,
"r_x1": 286.37,
"r_y1": 555.73,
"r_x2": 286.37,
"r_y2": 546.82,
"r_x3": 50.11,
"r_y3": 546.82,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 567.68,
"r_x1": 257.47,
"r_y1": 567.68,
"r_x2": 257.47,
"r_y2": 558.78,
"r_x3": 50.11,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.95,
"r_y0": 567.68,
"r_x1": 286.37,
"r_y1": 567.68,
"r_x2": 286.37,
"r_y2": 558.78,
"r_x3": 263.95,
"r_y3": 558.78,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 579.64,
"r_x1": 286.37,
"r_y1": 579.64,
"r_x2": 286.37,
"r_y2": 570.73,
"r_x3": 50.11,
"r_y3": 570.73,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 591.59,
"r_x1": 286.37,
"r_y1": 591.59,
"r_x2": 286.37,
"r_y2": 582.69,
"r_x3": 50.11,
"r_y3": 582.69,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 603.55,
"r_x1": 286.37,
"r_y1": 603.55,
"r_x2": 286.37,
"r_y2": 594.64,
"r_x3": 50.11,
"r_y3": 594.64,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 615.5,
"r_x1": 286.37,
"r_y1": 615.5,
"r_x2": 286.37,
"r_y2": 606.6,
"r_x3": 50.11,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 627.46,
"r_x1": 242.26,
"r_y1": 627.46,
"r_x2": 242.26,
"r_y2": 618.55,
"r_x3": 50.11,
"r_y3": 618.55,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 14,
"page_no": 10,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 630.71,
"r": 286.36,
"b": 651.57,
"coord_origin": "TOPLEFT"
},
"confidence": 0.934,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 639.62,
"r_x1": 286.36,
"r_y1": 639.62,
"r_x2": 286.36,
"r_y2": 630.71,
"r_x3": 62.07,
"r_y3": 630.71,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 651.57,
"r_x1": 179.9,
"r_y1": 651.57,
"r_x2": 179.9,
"r_y2": 642.67,
"r_x3": 50.11,
"r_y3": 642.67,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."
},
{
"label": "section_header",
"id": 12,
"page_no": 10,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.11,
"t": 662.39,
"r": 153.61,
"b": 672.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.952,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 672.24,
"r_x1": 64.3,
"r_y1": 672.24,
"r_x2": 64.3,
"r_y2": 662.39,
"r_x3": 50.11,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.75,
"r_y0": 672.24,
"r_x1": 153.61,
"r_y1": 672.24,
"r_x2": 153.61,
"r_y2": 662.39,
"r_x3": 73.75,
"r_y3": 662.39,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.2. Synthetic datasets"
},
{
"label": "text",
"id": 3,
"page_no": 10,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 681.33,
"r": 286.37,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 690.24,
"r_x1": 286.36,
"r_y1": 690.24,
"r_x2": 286.36,
"r_y2": 681.33,
"r_x3": 62.07,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 702.19,
"r_x1": 286.37,
"r_y1": 702.19,
"r_x2": 286.37,
"r_y2": 693.29,
"r_x3": 50.11,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 714.15,
"r_x1": 84.14,
"r_y1": 714.15,
"r_x2": 84.14,
"r_y2": 705.24,
"r_x3": 50.11,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.24,
"r_y0": 714.15,
"r_x1": 286.37,
"r_y1": 714.15,
"r_x2": 286.37,
"r_y2": 705.24,
"r_x3": 91.24,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"
},
{
"label": "text",
"id": 8,
"page_no": 10,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.86,
"t": 162.66,
"r": 545.12,
"b": 207.43,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 171.56,
"r_x1": 545.12,
"r_y1": 171.56,
"r_x2": 545.12,
"r_y2": 162.66,
"r_x3": 308.86,
"r_y3": 162.66,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 183.52,
"r_x1": 545.12,
"r_y1": 183.52,
"r_x2": 545.12,
"r_y2": 174.61,
"r_x3": 308.86,
"r_y3": 174.61,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 195.47,
"r_x1": 545.12,
"r_y1": 195.47,
"r_x2": 545.12,
"r_y2": 186.57,
"r_x3": 308.86,
"r_y3": 186.57,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 207.43,
"r_x1": 484.07,
"r_y1": 207.43,
"r_x2": 484.07,
"r_y2": 198.52,
"r_x3": 308.86,
"r_y3": 198.52,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."
},
{
"label": "text",
"id": 15,
"page_no": 10,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 308.86,
"t": 211.24,
"r": 545.12,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 220.14,
"r_x1": 545.12,
"r_y1": 220.14,
"r_x2": 545.12,
"r_y2": 211.24,
"r_x3": 320.82,
"r_y3": 211.24,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 232.1,
"r_x1": 448.09,
"r_y1": 232.1,
"r_x2": 448.09,
"r_y2": 223.19,
"r_x3": 308.86,
"r_y3": 223.19,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The process of generating a synthetic dataset can be decomposed into the following steps:"
},
{
"label": "list_item",
"id": 7,
"page_no": 10,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 235.91,
"r": 545.12,
"b": 316.54,
"coord_origin": "TOPLEFT"
},
"confidence": 0.964,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 244.81,
"r_x1": 328.29,
"r_y1": 244.81,
"r_x2": 328.29,
"r_y2": 235.91,
"r_x3": 320.82,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.38,
"r_y0": 244.81,
"r_x1": 545.11,
"r_y1": 244.81,
"r_x2": 545.11,
"r_y2": 235.91,
"r_x3": 335.38,
"r_y3": 235.91,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 256.77,
"r_x1": 545.12,
"r_y1": 256.77,
"r_x2": 545.12,
"r_y2": 247.86,
"r_x3": 308.86,
"r_y3": 247.86,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 268.72,
"r_x1": 545.12,
"r_y1": 268.72,
"r_x2": 545.12,
"r_y2": 259.82,
"r_x3": 308.86,
"r_y3": 259.82,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 280.68,
"r_x1": 393.38,
"r_y1": 280.68,
"r_x2": 393.38,
"r_y2": 271.77,
"r_x3": 308.86,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.12,
"r_y0": 280.68,
"r_x1": 545.12,
"r_y1": 280.68,
"r_x2": 545.12,
"r_y2": 271.77,
"r_x3": 400.12,
"r_y3": 271.77,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 292.63,
"r_x1": 545.12,
"r_y1": 292.63,
"r_x2": 545.12,
"r_y2": 283.73,
"r_x3": 308.86,
"r_y3": 283.73,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.59,
"r_x1": 545.12,
"r_y1": 304.59,
"r_x2": 545.12,
"r_y2": 295.68,
"r_x3": 308.86,
"r_y3": 295.68,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.54,
"r_x1": 425.69,
"r_y1": 316.54,
"r_x2": 425.69,
"r_y2": 307.64,
"r_x3": 308.86,
"r_y3": 307.64,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."
},
{
"label": "list_item",
"id": 6,
"page_no": 10,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 320.35,
"r": 545.12,
"b": 448.81,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 329.26,
"r_x1": 328.49,
"r_y1": 329.26,
"r_x2": 328.49,
"r_y2": 320.35,
"r_x3": 320.82,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.05,
"r_y0": 329.26,
"r_x1": 545.11,
"r_y1": 329.26,
"r_x2": 545.11,
"r_y2": 320.35,
"r_x3": 331.05,
"r_y3": 320.35,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 341.21,
"r_x1": 545.12,
"r_y1": 341.21,
"r_x2": 545.12,
"r_y2": 332.31,
"r_x3": 308.86,
"r_y3": 332.31,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 353.17,
"r_x1": 545.12,
"r_y1": 353.17,
"r_x2": 545.12,
"r_y2": 344.26,
"r_x3": 308.86,
"r_y3": 344.26,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 365.12,
"r_x1": 545.12,
"r_y1": 365.12,
"r_x2": 545.12,
"r_y2": 356.22,
"r_x3": 308.86,
"r_y3": 356.22,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 377.08,
"r_x1": 545.12,
"r_y1": 377.08,
"r_x2": 545.12,
"r_y2": 368.17,
"r_x3": 308.86,
"r_y3": 368.17,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 389.03,
"r_x1": 545.11,
"r_y1": 389.03,
"r_x2": 545.11,
"r_y2": 380.13,
"r_x3": 308.86,
"r_y3": 380.13,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 400.99,
"r_x1": 545.12,
"r_y1": 400.99,
"r_x2": 545.12,
"r_y2": 392.08,
"r_x3": 308.86,
"r_y3": 392.08,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.94,
"r_x1": 545.12,
"r_y1": 412.94,
"r_x2": 545.12,
"r_y2": 404.04,
"r_x3": 308.86,
"r_y3": 404.04,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.9,
"r_x1": 545.11,
"r_y1": 424.9,
"r_x2": 545.11,
"r_y2": 415.99,
"r_x3": 308.86,
"r_y3": 415.99,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.85,
"r_x1": 545.12,
"r_y1": 436.85,
"r_x2": 545.12,
"r_y2": 427.95,
"r_x3": 308.86,
"r_y3": 427.95,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.81,
"r_x1": 345.94,
"r_y1": 448.81,
"r_x2": 345.94,
"r_y2": 439.9,
"r_x3": 308.86,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."
},
{
"label": "list_item",
"id": 9,
"page_no": 10,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 452.62,
"r": 545.12,
"b": 497.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.957,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 461.52,
"r_x1": 328.3,
"r_y1": 461.52,
"r_x2": 328.3,
"r_y2": 452.62,
"r_x3": 320.82,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.52,
"r_x1": 485.76,
"r_y1": 461.52,
"r_x2": 485.76,
"r_y2": 452.62,
"r_x3": 330.8,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.07,
"r_y0": 461.29,
"r_x1": 511.86,
"r_y1": 461.29,
"r_x2": 511.86,
"r_y2": 452.71,
"r_x3": 488.07,
"r_y3": 452.71,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.86,
"r_y0": 461.52,
"r_x1": 545.11,
"r_y1": 461.52,
"r_x2": 545.11,
"r_y2": 452.62,
"r_x3": 511.86,
"r_y3": 452.62,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 473.48,
"r_x1": 545.12,
"r_y1": 473.48,
"r_x2": 545.12,
"r_y2": 464.57,
"r_x3": 308.86,
"r_y3": 464.57,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 485.43,
"r_x1": 545.12,
"r_y1": 485.43,
"r_x2": 545.12,
"r_y2": 476.53,
"r_x3": 308.86,
"r_y3": 476.53,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 497.39,
"r_x1": 379.15,
"r_y1": 497.39,
"r_x2": 379.15,
"r_y2": 488.48,
"r_x3": 308.86,
"r_y3": 488.48,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."
},
{
"label": "list_item",
"id": 5,
"page_no": 10,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 501.2,
"r": 545.12,
"b": 545.97,
"coord_origin": "TOPLEFT"
},
"confidence": 0.971,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 510.1,
"r_x1": 328.66,
"r_y1": 510.1,
"r_x2": 328.66,
"r_y2": 501.2,
"r_x3": 320.82,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.28,
"r_y0": 510.1,
"r_x1": 545.11,
"r_y1": 510.1,
"r_x2": 545.11,
"r_y2": 501.2,
"r_x3": 331.28,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 522.06,
"r_x1": 545.12,
"r_y1": 522.06,
"r_x2": 545.12,
"r_y2": 513.15,
"r_x3": 308.86,
"r_y3": 513.15,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 534.01,
"r_x1": 384.3,
"r_y1": 534.01,
"r_x2": 384.3,
"r_y2": 525.11,
"r_x3": 308.86,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.25,
"r_y0": 534.01,
"r_x1": 545.12,
"r_y1": 534.01,
"r_x2": 545.12,
"r_y2": 525.11,
"r_x3": 391.25,
"r_y3": 525.11,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 545.97,
"r_x1": 496.16,
"r_y1": 545.97,
"r_x2": 496.16,
"r_y2": 537.06,
"r_x3": 308.86,
"r_y3": 537.06,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."
},
{
"label": "list_item",
"id": 4,
"page_no": 10,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 549.78,
"r": 545.12,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.978,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 558.68,
"r_x1": 328.29,
"r_y1": 558.68,
"r_x2": 328.29,
"r_y2": 549.78,
"r_x3": 320.82,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.68,
"r_x1": 545.11,
"r_y1": 558.68,
"r_x2": 545.11,
"r_y2": 549.78,
"r_x3": 335.4,
"r_y3": 549.78,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 570.64,
"r_x1": 545.12,
"r_y1": 570.64,
"r_x2": 545.12,
"r_y2": 561.73,
"r_x3": 308.86,
"r_y3": 561.73,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 582.59,
"r_x1": 545.12,
"r_y1": 582.59,
"r_x2": 545.12,
"r_y2": 573.69,
"r_x3": 308.86,
"r_y3": 573.69,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 594.55,
"r_x1": 545.12,
"r_y1": 594.55,
"r_x2": 545.12,
"r_y2": 585.64,
"r_x3": 308.86,
"r_y3": 585.64,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 606.5,
"r_x1": 341.23,
"r_y1": 606.5,
"r_x2": 341.23,
"r_y2": 597.6,
"r_x3": 308.86,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."
},
{
"label": "section_header",
"id": 10,
"page_no": 10,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.86,
"t": 622.29,
"r": 545.11,
"b": 646.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 633.04,
"r_x1": 316.77,
"r_y1": 633.04,
"r_x2": 316.77,
"r_y2": 622.29,
"r_x3": 308.86,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.31,
"r_y0": 633.04,
"r_x1": 545.11,
"r_y1": 633.04,
"r_x2": 545.11,
"r_y2": 622.29,
"r_x3": 327.31,
"r_y3": 622.29,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 646.99,
"r_x1": 357.34,
"r_y1": 646.99,
"r_x2": 357.34,
"r_y2": 636.24,
"r_x3": 326.8,
"r_y3": 636.24,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Prediction post-processing for PDF documents"
},
{
"label": "text",
"id": 1,
"page_no": 10,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.86,
"t": 657.42,
"r": 545.12,
"b": 714.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.983,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 666.33,
"r_x1": 545.11,
"r_y1": 666.33,
"r_x2": 545.11,
"r_y2": 657.42,
"r_x3": 320.82,
"r_y3": 657.42,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 678.28,
"r_x1": 545.12,
"r_y1": 678.28,
"r_x2": 545.12,
"r_y2": 669.38,
"r_x3": 308.86,
"r_y3": 669.38,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 690.24,
"r_x1": 545.12,
"r_y1": 690.24,
"r_x2": 545.12,
"r_y2": 681.33,
"r_x3": 308.86,
"r_y3": 681.33,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 702.19,
"r_x1": 545.12,
"r_y1": 702.19,
"r_x2": 545.12,
"r_y2": 693.29,
"r_x3": 308.86,
"r_y3": 693.29,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 714.15,
"r_x1": 371.43,
"r_y1": 714.15,
"r_x2": 371.43,
"r_y2": 705.24,
"r_x3": 308.86,
"r_y3": 705.24,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"
}
],
"headers": [
{
"label": "page_footer",
"id": 16,
"page_no": 10,
"cluster": {
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.899,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "11"
}
]
}
},
{
"page_no": 11,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 174.41,
"r_x1": 545.11,
"r_y1": 174.41,
"r_x2": 545.11,
"r_y2": 165.5,
"r_x3": 50.11,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 186.36,
"r_x1": 513.52,
"r_y1": 186.36,
"r_x2": 513.52,
"r_y2": 177.46,
"r_x3": 50.11,
"r_y3": 177.46,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 219.84,
"r_x1": 71.15,
"r_y1": 219.84,
"r_x2": 71.15,
"r_y2": 210.93,
"r_x3": 61.57,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.54,
"r_y0": 219.84,
"r_x1": 286.37,
"r_y1": 219.84,
"r_x2": 286.37,
"r_y2": 210.93,
"r_x3": 73.54,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 231.79,
"r_x1": 87.47,
"r_y1": 231.79,
"r_x2": 87.47,
"r_y2": 222.89,
"r_x3": 70.04,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 252.98,
"r_x1": 71.35,
"r_y1": 252.98,
"r_x2": 71.35,
"r_y2": 244.07,
"r_x3": 61.57,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.79,
"r_y0": 252.98,
"r_x1": 286.37,
"r_y1": 252.98,
"r_x2": 286.37,
"r_y2": 244.07,
"r_x3": 73.79,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 264.93,
"r_x1": 150.42,
"r_y1": 264.93,
"r_x2": 150.42,
"r_y2": 256.03,
"r_x3": 70.04,
"r_y3": 256.03,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 288.11,
"r_x1": 286.36,
"r_y1": 288.11,
"r_x2": 286.36,
"r_y2": 279.2,
"r_x3": 62.07,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.06,
"r_x1": 286.37,
"r_y1": 300.06,
"r_x2": 286.37,
"r_y2": 291.16,
"r_x3": 50.11,
"r_y3": 291.16,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.02,
"r_x1": 286.37,
"r_y1": 312.02,
"r_x2": 286.37,
"r_y2": 303.11,
"r_x3": 50.11,
"r_y3": 303.11,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.97,
"r_x1": 286.37,
"r_y1": 323.97,
"r_x2": 286.37,
"r_y2": 315.07,
"r_x3": 50.11,
"r_y3": 315.07,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.93,
"r_x1": 286.37,
"r_y1": 335.93,
"r_x2": 286.37,
"r_y2": 327.02,
"r_x3": 50.11,
"r_y3": 327.02,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.89,
"r_x1": 286.37,
"r_y1": 347.89,
"r_x2": 286.37,
"r_y2": 338.98,
"r_x3": 50.11,
"r_y3": 338.98,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.84,
"r_x1": 286.37,
"r_y1": 359.84,
"r_x2": 286.37,
"r_y2": 350.93,
"r_x3": 50.11,
"r_y3": 350.93,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.8,
"r_x1": 286.37,
"r_y1": 371.8,
"r_x2": 286.37,
"r_y2": 362.89,
"r_x3": 50.11,
"r_y3": 362.89,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.75,
"r_x1": 286.37,
"r_y1": 383.75,
"r_x2": 286.37,
"r_y2": 374.84,
"r_x3": 50.11,
"r_y3": 374.84,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.71,
"r_x1": 154.56,
"r_y1": 395.71,
"r_x2": 154.56,
"r_y2": 386.8,
"r_x3": 50.11,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 407.98,
"r_x1": 286.36,
"r_y1": 407.98,
"r_x2": 286.36,
"r_y2": 399.07,
"r_x3": 62.07,
"r_y3": 399.07,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 419.93,
"r_x1": 95.49,
"r_y1": 419.93,
"r_x2": 95.49,
"r_y2": 411.03,
"r_x3": 50.11,
"r_y3": 411.03,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 432.2,
"r_x1": 69.37,
"r_y1": 432.2,
"r_x2": 69.37,
"r_y2": 423.3,
"r_x3": 62.07,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.81,
"r_y0": 432.2,
"r_x1": 286.37,
"r_y1": 432.2,
"r_x2": 286.37,
"r_y2": 423.3,
"r_x3": 71.81,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.16,
"r_x1": 286.37,
"r_y1": 444.16,
"r_x2": 286.37,
"r_y2": 435.25,
"r_x3": 50.11,
"r_y3": 435.25,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 456.11,
"r_x1": 274.51,
"r_y1": 456.11,
"r_x2": 274.51,
"r_y2": 447.21,
"r_x3": 50.11,
"r_y3": 447.21,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 468.38,
"r_x1": 69.54,
"r_y1": 468.38,
"r_x2": 69.54,
"r_y2": 459.48,
"r_x3": 62.07,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.43,
"r_y0": 468.38,
"r_x1": 286.36,
"r_y1": 468.38,
"r_x2": 286.36,
"r_y2": 459.48,
"r_x3": 77.43,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 480.34,
"r_x1": 286.37,
"r_y1": 480.34,
"r_x2": 286.37,
"r_y2": 471.43,
"r_x3": 50.11,
"r_y3": 471.43,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.29,
"r_x1": 286.37,
"r_y1": 492.29,
"r_x2": 286.37,
"r_y2": 483.39,
"r_x3": 50.11,
"r_y3": 483.39,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 504.25,
"r_x1": 110.7,
"r_y1": 504.25,
"r_x2": 110.7,
"r_y2": 495.34,
"r_x3": 50.11,
"r_y3": 495.34,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 516.52,
"r_x1": 69.86,
"r_y1": 516.52,
"r_x2": 69.86,
"r_y2": 507.61,
"r_x3": 62.07,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.46,
"r_y0": 516.52,
"r_x1": 286.36,
"r_y1": 516.52,
"r_x2": 286.36,
"r_y2": 507.61,
"r_x3": 72.46,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 528.47,
"r_x1": 226.07,
"r_y1": 528.47,
"r_x2": 226.07,
"r_y2": 519.57,
"r_x3": 50.11,
"r_y3": 519.57,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 540.74,
"r_x1": 286.36,
"r_y1": 540.74,
"r_x2": 286.36,
"r_y2": 531.84,
"r_x3": 62.07,
"r_y3": 531.84,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 552.7,
"r_x1": 286.37,
"r_y1": 552.7,
"r_x2": 286.37,
"r_y2": 543.79,
"r_x3": 50.11,
"r_y3": 543.79,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 564.65,
"r_x1": 114.03,
"r_y1": 564.65,
"r_x2": 114.03,
"r_y2": 555.75,
"r_x3": 50.11,
"r_y3": 555.75,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 576.92,
"r_x1": 69.54,
"r_y1": 576.92,
"r_x2": 69.54,
"r_y2": 568.02,
"r_x3": 62.07,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.73,
"r_y0": 576.92,
"r_x1": 286.37,
"r_y1": 576.92,
"r_x2": 286.37,
"r_y2": 568.02,
"r_x3": 76.73,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 588.88,
"r_x1": 286.37,
"r_y1": 588.88,
"r_x2": 286.37,
"r_y2": 579.97,
"r_x3": 50.11,
"r_y3": 579.97,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 600.83,
"r_x1": 278.7,
"r_y1": 600.83,
"r_x2": 278.7,
"r_y2": 591.93,
"r_x3": 50.11,
"r_y3": 591.93,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.03,
"r_y0": 632.84,
"r_x1": 157.95,
"r_y1": 632.84,
"r_x2": 157.95,
"r_y2": 623.99,
"r_x3": 112.03,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.72,
"r_y0": 632.84,
"r_x1": 203.5,
"r_y1": 632.84,
"r_x2": 203.5,
"r_y2": 623.99,
"r_x3": 160.72,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 640.18,
"r_x1": 189.15,
"r_y1": 640.18,
"r_x2": 189.15,
"r_y2": 633.98,
"r_x3": 185.58,
"r_y3": 633.98,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.84,
"r_x1": 208.48,
"r_y1": 632.84,
"r_x2": 208.48,
"r_y2": 623.44,
"r_x3": 203.5,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.48,
"r_y0": 632.84,
"r_x1": 220.29,
"r_y1": 632.84,
"r_x2": 220.29,
"r_y2": 623.99,
"r_x3": 208.48,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 632.84,
"r_x1": 225.77,
"r_y1": 632.84,
"r_x2": 225.77,
"r_y2": 623.44,
"r_x3": 220.79,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.11,
"r_x1": 122.51,
"r_y1": 654.11,
"r_x2": 122.51,
"r_y2": 645.26,
"r_x3": 110.7,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.78,
"r_y0": 654.11,
"r_x1": 133.53,
"r_y1": 654.11,
"r_x2": 133.53,
"r_y2": 645.26,
"r_x3": 125.78,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.29,
"r_y0": 654.11,
"r_x1": 156.0,
"r_y1": 654.11,
"r_x2": 156.0,
"r_y2": 645.26,
"r_x3": 136.29,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.11,
"r_x1": 160.98,
"r_y1": 654.11,
"r_x2": 160.98,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.98,
"r_y0": 654.11,
"r_x1": 170.24,
"r_y1": 654.11,
"r_x2": 170.24,
"r_y2": 645.26,
"r_x3": 160.98,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.74,
"r_y0": 654.11,
"r_x1": 185.68,
"r_y1": 654.11,
"r_x2": 185.68,
"r_y2": 644.7,
"r_x3": 170.74,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.89,
"r_y0": 654.11,
"r_x1": 206.05,
"r_y1": 654.11,
"r_x2": 206.05,
"r_y2": 645.26,
"r_x3": 187.89,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.05,
"r_y0": 654.11,
"r_x1": 211.04,
"r_y1": 654.11,
"r_x2": 211.04,
"r_y2": 644.7,
"r_x3": 206.05,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.03,
"r_y0": 654.11,
"r_x1": 220.29,
"r_y1": 654.11,
"r_x2": 220.29,
"r_y2": 645.26,
"r_x3": 211.03,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 654.11,
"r_x1": 225.77,
"r_y1": 654.11,
"r_x2": 225.77,
"r_y2": 644.7,
"r_x3": 220.79,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 643.79,
"r_x1": 286.36,
"r_y1": 643.79,
"r_x2": 286.36,
"r_y2": 634.89,
"r_x3": 274.75,
"r_y3": 634.89,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 676.97,
"r_x1": 74.45,
"r_y1": 676.97,
"r_x2": 74.45,
"r_y2": 668.07,
"r_x3": 50.11,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.34,
"r_y0": 676.75,
"r_x1": 82.65,
"r_y1": 676.75,
"r_x2": 82.65,
"r_y2": 667.91,
"r_x3": 78.34,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.53,
"r_y0": 676.97,
"r_x1": 123.63,
"r_y1": 676.97,
"r_x2": 123.63,
"r_y2": 668.07,
"r_x3": 86.53,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.52,
"r_y0": 676.75,
"r_x1": 132.5,
"r_y1": 676.75,
"r_x2": 132.5,
"r_y2": 667.35,
"r_x3": 127.52,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 676.97,
"r_x1": 210.7,
"r_y1": 676.97,
"r_x2": 210.7,
"r_y2": 668.07,
"r_x3": 132.5,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.75,
"r_x1": 215.68,
"r_y1": 676.75,
"r_x2": 215.68,
"r_y2": 667.35,
"r_x3": 210.7,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.56,
"r_y0": 676.97,
"r_x1": 233.95,
"r_y1": 676.97,
"r_x2": 233.95,
"r_y2": 668.07,
"r_x3": 219.56,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.83,
"r_y0": 676.75,
"r_x1": 247.09,
"r_y1": 676.75,
"r_x2": 247.09,
"r_y2": 667.91,
"r_x3": 237.83,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.47,
"r_y0": 676.97,
"r_x1": 286.36,
"r_y1": 676.97,
"r_x2": 286.36,
"r_y2": 668.07,
"r_x3": 251.47,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 688.93,
"r_x1": 205.89,
"r_y1": 688.93,
"r_x2": 205.89,
"r_y2": 680.02,
"r_x3": 50.11,
"r_y3": 680.02,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 701.2,
"r_x1": 69.54,
"r_y1": 701.2,
"r_x2": 69.54,
"r_y2": 692.29,
"r_x3": 62.07,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.27,
"r_y0": 701.2,
"r_x1": 286.36,
"r_y1": 701.2,
"r_x2": 286.36,
"r_y2": 692.29,
"r_x3": 76.27,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 94.6,
"r_y1": 713.15,
"r_x2": 94.6,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.93,
"r_x1": 103.29,
"r_y1": 712.93,
"r_x2": 103.29,
"r_y2": 704.09,
"r_x3": 97.6,
"r_y3": 704.09,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.29,
"r_y0": 713.15,
"r_x1": 286.36,
"r_y1": 713.15,
"r_x2": 286.36,
"r_y2": 704.25,
"r_x3": 103.29,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 219.84,
"r_x1": 545.12,
"r_y1": 219.84,
"r_x2": 545.12,
"r_y2": 210.93,
"r_x3": 308.86,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 231.79,
"r_x1": 545.12,
"r_y1": 231.79,
"r_x2": 545.12,
"r_y2": 222.89,
"r_x3": 308.86,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 243.75,
"r_x1": 545.12,
"r_y1": 243.75,
"r_x2": 545.12,
"r_y2": 234.84,
"r_x3": 308.86,
"r_y3": 234.84,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 255.7,
"r_x1": 339.58,
"r_y1": 255.7,
"r_x2": 339.58,
"r_y2": 246.8,
"r_x3": 308.86,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 268.01,
"r_x1": 328.29,
"r_y1": 268.01,
"r_x2": 328.29,
"r_y2": 259.1,
"r_x3": 320.82,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.88,
"r_y0": 268.01,
"r_x1": 545.11,
"r_y1": 268.01,
"r_x2": 545.11,
"r_y2": 259.1,
"r_x3": 334.88,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 279.96,
"r_x1": 338.19,
"r_y1": 279.96,
"r_x2": 338.19,
"r_y2": 271.06,
"r_x3": 308.86,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.68,
"r_y0": 279.74,
"r_x1": 346.38,
"r_y1": 279.74,
"r_x2": 346.38,
"r_y2": 270.9,
"r_x3": 340.68,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.38,
"r_y0": 279.96,
"r_x1": 453.72,
"r_y1": 279.96,
"r_x2": 453.72,
"r_y2": 271.06,
"r_x3": 346.38,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 292.27,
"r_x1": 328.39,
"r_y1": 292.27,
"r_x2": 328.39,
"r_y2": 283.36,
"r_x3": 320.82,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.91,
"r_y0": 292.27,
"r_x1": 545.11,
"r_y1": 292.27,
"r_x2": 545.11,
"r_y2": 283.36,
"r_x3": 330.91,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.22,
"r_x1": 545.12,
"r_y1": 304.22,
"r_x2": 545.12,
"r_y2": 295.32,
"r_x3": 308.86,
"r_y3": 295.32,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.18,
"r_x1": 545.12,
"r_y1": 316.18,
"r_x2": 545.12,
"r_y2": 307.27,
"r_x3": 308.86,
"r_y3": 307.27,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.13,
"r_x1": 545.12,
"r_y1": 328.13,
"r_x2": 545.12,
"r_y2": 319.23,
"r_x3": 308.86,
"r_y3": 319.23,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 340.09,
"r_x1": 397.19,
"r_y1": 340.09,
"r_x2": 397.19,
"r_y2": 331.18,
"r_x3": 308.86,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.66,
"r_y0": 340.09,
"r_x1": 545.12,
"r_y1": 340.09,
"r_x2": 545.12,
"r_y2": 331.18,
"r_x3": 403.66,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.05,
"r_x1": 545.12,
"r_y1": 352.05,
"r_x2": 545.12,
"r_y2": 343.14,
"r_x3": 308.86,
"r_y3": 343.14,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.0,
"r_x1": 545.12,
"r_y1": 364.0,
"r_x2": 545.12,
"r_y2": 355.09,
"r_x3": 308.86,
"r_y3": 355.09,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 375.96,
"r_x1": 545.12,
"r_y1": 375.96,
"r_x2": 545.12,
"r_y2": 367.05,
"r_x3": 308.86,
"r_y3": 367.05,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 387.91,
"r_x1": 329.61,
"r_y1": 387.91,
"r_x2": 329.61,
"r_y2": 379.0,
"r_x3": 308.86,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 400.22,
"r_x1": 328.55,
"r_y1": 400.22,
"r_x2": 328.55,
"r_y2": 391.31,
"r_x3": 320.82,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.13,
"r_y0": 400.22,
"r_x1": 545.12,
"r_y1": 400.22,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 331.13,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.27,
"r_x3": 308.86,
"r_y3": 403.27,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.13,
"r_x1": 545.12,
"r_y1": 424.13,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.18,
"r_x3": 308.86,
"r_y3": 427.18,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.04,
"r_x1": 545.12,
"r_y1": 448.04,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 426.18,
"r_y1": 459.99,
"r_x2": 426.18,
"r_y2": 451.09,
"r_x3": 308.86,
"r_y3": 451.09,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 472.3,
"r_x1": 328.67,
"r_y1": 472.3,
"r_x2": 328.67,
"r_y2": 463.39,
"r_x3": 320.82,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.29,
"r_y0": 472.3,
"r_x1": 545.11,
"r_y1": 472.3,
"r_x2": 545.11,
"r_y2": 463.39,
"r_x3": 331.29,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.25,
"r_x1": 545.12,
"r_y1": 484.25,
"r_x2": 545.12,
"r_y2": 475.35,
"r_x3": 308.86,
"r_y3": 475.35,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.21,
"r_x1": 545.12,
"r_y1": 496.21,
"r_x2": 545.12,
"r_y2": 487.3,
"r_x3": 308.86,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.16,
"r_x1": 381.9,
"r_y1": 508.16,
"r_x2": 381.9,
"r_y2": 499.26,
"r_x3": 308.86,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.16,
"r_x1": 545.12,
"r_y1": 508.16,
"r_x2": 545.12,
"r_y2": 499.26,
"r_x3": 388.7,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.12,
"r_x1": 545.12,
"r_y1": 520.12,
"r_x2": 545.12,
"r_y2": 511.21,
"r_x3": 308.86,
"r_y3": 511.21,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 532.07,
"r_x1": 545.12,
"r_y1": 532.07,
"r_x2": 545.12,
"r_y2": 523.17,
"r_x3": 308.86,
"r_y3": 523.17,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 544.03,
"r_x1": 545.11,
"r_y1": 544.03,
"r_x2": 545.11,
"r_y2": 535.12,
"r_x3": 308.86,
"r_y3": 535.12,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.98,
"r_x1": 545.12,
"r_y1": 555.98,
"r_x2": 545.12,
"r_y2": 547.08,
"r_x3": 308.86,
"r_y3": 547.08,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.94,
"r_x1": 442.22,
"r_y1": 567.94,
"r_x2": 442.22,
"r_y2": 559.03,
"r_x3": 308.86,
"r_y3": 559.03,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 580.24,
"r_x1": 545.11,
"r_y1": 580.24,
"r_x2": 545.11,
"r_y2": 571.34,
"r_x3": 320.82,
"r_y3": 571.34,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 592.2,
"r_x1": 471.64,
"r_y1": 592.2,
"r_x2": 471.64,
"r_y2": 583.29,
"r_x3": 308.86,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.83,
"r_y0": 591.98,
"r_x1": 479.72,
"r_y1": 591.98,
"r_x2": 479.72,
"r_y2": 583.13,
"r_x3": 474.83,
"r_y3": 583.13,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.27,
"r_y0": 592.2,
"r_x1": 545.12,
"r_y1": 592.2,
"r_x2": 545.12,
"r_y2": 583.29,
"r_x3": 483.27,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 604.15,
"r_x1": 329.91,
"r_y1": 604.15,
"r_x2": 329.91,
"r_y2": 595.25,
"r_x3": 308.86,
"r_y3": 595.25,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 616.46,
"r_x1": 332.87,
"r_y1": 616.46,
"r_x2": 332.87,
"r_y2": 607.55,
"r_x3": 320.82,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.93,
"r_y0": 616.46,
"r_x1": 545.12,
"r_y1": 616.46,
"r_x2": 545.12,
"r_y2": 607.55,
"r_x3": 339.93,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 628.42,
"r_x1": 495.29,
"r_y1": 628.42,
"r_x2": 495.29,
"r_y2": 619.51,
"r_x3": 308.86,
"r_y3": 619.51,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 640.72,
"r_x1": 545.12,
"r_y1": 640.72,
"r_x2": 545.12,
"r_y2": 631.81,
"r_x3": 320.82,
"r_y3": 631.81,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 652.68,
"r_x1": 455.28,
"r_y1": 652.68,
"r_x2": 455.28,
"r_y2": 643.77,
"r_x3": 308.86,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.78,
"r_y0": 652.46,
"r_x1": 463.47,
"r_y1": 652.46,
"r_x2": 463.47,
"r_y2": 643.61,
"r_x3": 457.78,
"r_y3": 643.61,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.97,
"r_y0": 652.68,
"r_x1": 545.11,
"r_y1": 652.68,
"r_x2": 545.11,
"r_y2": 643.77,
"r_x3": 465.97,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 664.63,
"r_x1": 332.38,
"r_y1": 664.63,
"r_x2": 332.38,
"r_y2": 655.72,
"r_x3": 308.86,
"r_y3": 655.72,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 676.94,
"r_x1": 545.11,
"r_y1": 676.94,
"r_x2": 545.11,
"r_y2": 668.03,
"r_x3": 320.82,
"r_y3": 668.03,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 688.89,
"r_x1": 510.58,
"r_y1": 688.89,
"r_x2": 510.58,
"r_y2": 679.99,
"r_x3": 308.86,
"r_y3": 679.99,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 320.82,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 30,
"label": "picture",
"bbox": {
"l": 53.54,
"t": 74.75,
"r": 544.94,
"b": 147.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.603,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.39,
"t": 77.31,
"r": 151.95,
"b": 83.26,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.35,
"t": 75.19,
"r": 59.33,
"b": 81.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.58,
"t": 77.46,
"r": 319.83,
"b": 83.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.37,
"t": 77.25,
"r": 481.76,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.55,
"t": 141.28,
"r": 94.98,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.04,
"t": 101.1,
"r": 85.29,
"b": 106.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.77,
"t": 124.4,
"r": 85.23,
"b": 129.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.55,
"t": 102.54,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 126.99,
"r": 249.66,
"b": 131.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.23,
"t": 114.05,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.38,
"t": 141.28,
"r": 105.08,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.94,
"t": 85.73,
"r": 76.15,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.22,
"r": 106.99,
"b": 91.18,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.21,
"t": 141.61,
"r": 281.88,
"b": 146.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.73,
"r": 241.91,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.94,
"t": 86.09,
"r": 282.49,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.19,
"t": 141.28,
"r": 444.69,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.37,
"t": 85.73,
"r": 432.67,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.61,
"t": 86.26,
"r": 445.62,
"b": 91.22,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.95,
"t": 141.29,
"r": 136.2,
"b": 146.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.92,
"t": 94.82,
"r": 127.05,
"b": 99.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.31,
"t": 100.94,
"r": 127.05,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.94,
"t": 107.06,
"r": 127.06,
"b": 112.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.23,
"t": 122.62,
"r": 126.97,
"b": 127.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.85,
"t": 128.74,
"r": 126.97,
"b": 133.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.58,
"t": 141.44,
"r": 156.04,
"b": 146.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.03,
"t": 86.27,
"r": 151.04,
"b": 91.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.65,
"t": 86.55,
"r": 321.67,
"b": 91.51,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.89,
"t": 141.71,
"r": 310.15,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.24,
"t": 93.08,
"r": 299.37,
"b": 98.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.64,
"t": 99.2,
"r": 299.37,
"b": 104.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.26,
"t": 105.32,
"r": 299.38,
"b": 110.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.43,
"t": 120.39,
"r": 299.17,
"b": 125.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.06,
"t": 126.51,
"r": 299.17,
"b": 131.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.35,
"t": 141.71,
"r": 328.81,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.58,
"t": 86.69,
"r": 309.6,
"b": 91.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.04,
"t": 141.67,
"r": 483.5,
"b": 146.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.02,
"t": 93.76,
"r": 469.16,
"b": 98.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.42,
"t": 99.88,
"r": 469.16,
"b": 104.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.05,
"t": 106.0,
"r": 469.16,
"b": 110.96,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.39,
"t": 85.57,
"r": 480.65,
"b": 90.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.38,
"t": 141.58,
"r": 182.63,
"b": 146.54,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.74,
"t": 94.86,
"r": 173.33,
"b": 99.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.51,
"t": 100.98,
"r": 173.32,
"b": 105.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.27,
"t": 107.1,
"r": 173.33,
"b": 112.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.41,
"t": 107.23,
"r": 346.0,
"b": 112.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.18,
"t": 113.35,
"r": 345.99,
"b": 118.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.94,
"t": 119.47,
"r": 346.0,
"b": 124.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 488.99,
"t": 104.15,
"r": 508.76,
"b": 109.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.19,
"t": 110.27,
"r": 508.76,
"b": 115.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.72,
"t": 116.39,
"r": 508.77,
"b": 121.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.71,
"t": 122.51,
"r": 508.77,
"b": 127.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.38,
"t": 141.71,
"r": 202.84,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.14,
"r": 197.53,
"b": 91.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.38,
"t": 86.0,
"r": 367.4,
"b": 90.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.73,
"t": 141.62,
"r": 374.93,
"b": 146.58,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.69,
"t": 86.06,
"r": 355.71,
"b": 91.01,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.54,
"t": 141.38,
"r": 526.01,
"b": 146.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.45,
"t": 86.09,
"r": 523.71,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 165.5,
"r": 545.11,
"b": 186.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 174.41,
"r_x1": 545.11,
"r_y1": 174.41,
"r_x2": 545.11,
"r_y2": 165.5,
"r_x3": 50.11,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 186.36,
"r_x1": 513.52,
"r_y1": 186.36,
"r_x2": 513.52,
"r_y2": 177.46,
"r_x3": 50.11,
"r_y3": 177.46,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 210.93,
"r": 286.37,
"b": 231.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 219.84,
"r_x1": 71.15,
"r_y1": 219.84,
"r_x2": 71.15,
"r_y2": 210.93,
"r_x3": 61.57,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.54,
"r_y0": 219.84,
"r_x1": 286.37,
"r_y1": 219.84,
"r_x2": 286.37,
"r_y2": 210.93,
"r_x3": 73.54,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 231.79,
"r_x1": 87.47,
"r_y1": 231.79,
"r_x2": 87.47,
"r_y2": 222.89,
"r_x3": 70.04,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 244.07,
"r": 286.37,
"b": 264.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.963,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 252.98,
"r_x1": 71.35,
"r_y1": 252.98,
"r_x2": 71.35,
"r_y2": 244.07,
"r_x3": 61.57,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.79,
"r_y0": 252.98,
"r_x1": 286.37,
"r_y1": 252.98,
"r_x2": 286.37,
"r_y2": 244.07,
"r_x3": 73.79,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 264.93,
"r_x1": 150.42,
"r_y1": 264.93,
"r_x2": 150.42,
"r_y2": 256.03,
"r_x3": 70.04,
"r_y3": 256.03,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 279.2,
"r": 286.37,
"b": 395.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 288.11,
"r_x1": 286.36,
"r_y1": 288.11,
"r_x2": 286.36,
"r_y2": 279.2,
"r_x3": 62.07,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.06,
"r_x1": 286.37,
"r_y1": 300.06,
"r_x2": 286.37,
"r_y2": 291.16,
"r_x3": 50.11,
"r_y3": 291.16,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.02,
"r_x1": 286.37,
"r_y1": 312.02,
"r_x2": 286.37,
"r_y2": 303.11,
"r_x3": 50.11,
"r_y3": 303.11,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.97,
"r_x1": 286.37,
"r_y1": 323.97,
"r_x2": 286.37,
"r_y2": 315.07,
"r_x3": 50.11,
"r_y3": 315.07,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.93,
"r_x1": 286.37,
"r_y1": 335.93,
"r_x2": 286.37,
"r_y2": 327.02,
"r_x3": 50.11,
"r_y3": 327.02,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.89,
"r_x1": 286.37,
"r_y1": 347.89,
"r_x2": 286.37,
"r_y2": 338.98,
"r_x3": 50.11,
"r_y3": 338.98,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.84,
"r_x1": 286.37,
"r_y1": 359.84,
"r_x2": 286.37,
"r_y2": 350.93,
"r_x3": 50.11,
"r_y3": 350.93,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.8,
"r_x1": 286.37,
"r_y1": 371.8,
"r_x2": 286.37,
"r_y2": 362.89,
"r_x3": 50.11,
"r_y3": 362.89,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.75,
"r_x1": 286.37,
"r_y1": 383.75,
"r_x2": 286.37,
"r_y2": 374.84,
"r_x3": 50.11,
"r_y3": 374.84,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.71,
"r_x1": 154.56,
"r_y1": 395.71,
"r_x2": 154.56,
"r_y2": 386.8,
"r_x3": 50.11,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 399.07,
"r": 286.36,
"b": 419.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.935,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 407.98,
"r_x1": 286.36,
"r_y1": 407.98,
"r_x2": 286.36,
"r_y2": 399.07,
"r_x3": 62.07,
"r_y3": 399.07,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 419.93,
"r_x1": 95.49,
"r_y1": 419.93,
"r_x2": 95.49,
"r_y2": 411.03,
"r_x3": 50.11,
"r_y3": 411.03,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 423.3,
"r": 286.37,
"b": 456.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.828,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 432.2,
"r_x1": 69.37,
"r_y1": 432.2,
"r_x2": 69.37,
"r_y2": 423.3,
"r_x3": 62.07,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.81,
"r_y0": 432.2,
"r_x1": 286.37,
"r_y1": 432.2,
"r_x2": 286.37,
"r_y2": 423.3,
"r_x3": 71.81,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.16,
"r_x1": 286.37,
"r_y1": 444.16,
"r_x2": 286.37,
"r_y2": 435.25,
"r_x3": 50.11,
"r_y3": 435.25,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 456.11,
"r_x1": 274.51,
"r_y1": 456.11,
"r_x2": 274.51,
"r_y2": 447.21,
"r_x3": 50.11,
"r_y3": 447.21,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 459.48,
"r": 286.37,
"b": 504.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 468.38,
"r_x1": 69.54,
"r_y1": 468.38,
"r_x2": 69.54,
"r_y2": 459.48,
"r_x3": 62.07,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.43,
"r_y0": 468.38,
"r_x1": 286.36,
"r_y1": 468.38,
"r_x2": 286.36,
"r_y2": 459.48,
"r_x3": 77.43,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 480.34,
"r_x1": 286.37,
"r_y1": 480.34,
"r_x2": 286.37,
"r_y2": 471.43,
"r_x3": 50.11,
"r_y3": 471.43,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.29,
"r_x1": 286.37,
"r_y1": 492.29,
"r_x2": 286.37,
"r_y2": 483.39,
"r_x3": 50.11,
"r_y3": 483.39,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 504.25,
"r_x1": 110.7,
"r_y1": 504.25,
"r_x2": 110.7,
"r_y2": 495.34,
"r_x3": 50.11,
"r_y3": 495.34,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 507.61,
"r": 286.36,
"b": 528.47,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 516.52,
"r_x1": 69.86,
"r_y1": 516.52,
"r_x2": 69.86,
"r_y2": 507.61,
"r_x3": 62.07,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.46,
"r_y0": 516.52,
"r_x1": 286.36,
"r_y1": 516.52,
"r_x2": 286.36,
"r_y2": 507.61,
"r_x3": 72.46,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 528.47,
"r_x1": 226.07,
"r_y1": 528.47,
"r_x2": 226.07,
"r_y2": 519.57,
"r_x3": 50.11,
"r_y3": 519.57,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 531.84,
"r": 286.37,
"b": 564.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.949,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 540.74,
"r_x1": 286.36,
"r_y1": 540.74,
"r_x2": 286.36,
"r_y2": 531.84,
"r_x3": 62.07,
"r_y3": 531.84,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 552.7,
"r_x1": 286.37,
"r_y1": 552.7,
"r_x2": 286.37,
"r_y2": 543.79,
"r_x3": 50.11,
"r_y3": 543.79,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 564.65,
"r_x1": 114.03,
"r_y1": 564.65,
"r_x2": 114.03,
"r_y2": 555.75,
"r_x3": 50.11,
"r_y3": 555.75,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 568.02,
"r": 286.37,
"b": 600.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 576.92,
"r_x1": 69.54,
"r_y1": 576.92,
"r_x2": 69.54,
"r_y2": 568.02,
"r_x3": 62.07,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.73,
"r_y0": 576.92,
"r_x1": 286.37,
"r_y1": 576.92,
"r_x2": 286.37,
"r_y2": 568.02,
"r_x3": 76.73,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 588.88,
"r_x1": 286.37,
"r_y1": 588.88,
"r_x2": 286.37,
"r_y2": 579.97,
"r_x3": 50.11,
"r_y3": 579.97,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 600.83,
"r_x1": 278.7,
"r_y1": 600.83,
"r_x2": 278.7,
"r_y2": 591.93,
"r_x3": 50.11,
"r_y3": 591.93,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.44,
"r": 286.36,
"b": 654.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.03,
"r_y0": 632.84,
"r_x1": 157.95,
"r_y1": 632.84,
"r_x2": 157.95,
"r_y2": 623.99,
"r_x3": 112.03,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.72,
"r_y0": 632.84,
"r_x1": 203.5,
"r_y1": 632.84,
"r_x2": 203.5,
"r_y2": 623.99,
"r_x3": 160.72,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 640.18,
"r_x1": 189.15,
"r_y1": 640.18,
"r_x2": 189.15,
"r_y2": 633.98,
"r_x3": 185.58,
"r_y3": 633.98,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.84,
"r_x1": 208.48,
"r_y1": 632.84,
"r_x2": 208.48,
"r_y2": 623.44,
"r_x3": 203.5,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.48,
"r_y0": 632.84,
"r_x1": 220.29,
"r_y1": 632.84,
"r_x2": 220.29,
"r_y2": 623.99,
"r_x3": 208.48,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 632.84,
"r_x1": 225.77,
"r_y1": 632.84,
"r_x2": 225.77,
"r_y2": 623.44,
"r_x3": 220.79,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.11,
"r_x1": 122.51,
"r_y1": 654.11,
"r_x2": 122.51,
"r_y2": 645.26,
"r_x3": 110.7,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.78,
"r_y0": 654.11,
"r_x1": 133.53,
"r_y1": 654.11,
"r_x2": 133.53,
"r_y2": 645.26,
"r_x3": 125.78,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.29,
"r_y0": 654.11,
"r_x1": 156.0,
"r_y1": 654.11,
"r_x2": 156.0,
"r_y2": 645.26,
"r_x3": 136.29,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.11,
"r_x1": 160.98,
"r_y1": 654.11,
"r_x2": 160.98,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.98,
"r_y0": 654.11,
"r_x1": 170.24,
"r_y1": 654.11,
"r_x2": 170.24,
"r_y2": 645.26,
"r_x3": 160.98,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.74,
"r_y0": 654.11,
"r_x1": 185.68,
"r_y1": 654.11,
"r_x2": 185.68,
"r_y2": 644.7,
"r_x3": 170.74,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.89,
"r_y0": 654.11,
"r_x1": 206.05,
"r_y1": 654.11,
"r_x2": 206.05,
"r_y2": 645.26,
"r_x3": 187.89,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.05,
"r_y0": 654.11,
"r_x1": 211.04,
"r_y1": 654.11,
"r_x2": 211.04,
"r_y2": 644.7,
"r_x3": 206.05,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.03,
"r_y0": 654.11,
"r_x1": 220.29,
"r_y1": 654.11,
"r_x2": 220.29,
"r_y2": 645.26,
"r_x3": 211.03,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 654.11,
"r_x1": 225.77,
"r_y1": 654.11,
"r_x2": 225.77,
"r_y2": 644.7,
"r_x3": 220.79,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 643.79,
"r_x1": 286.36,
"r_y1": 643.79,
"r_x2": 286.36,
"r_y2": 634.89,
"r_x3": 274.75,
"r_y3": 634.89,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 667.35,
"r": 286.36,
"b": 688.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 676.97,
"r_x1": 74.45,
"r_y1": 676.97,
"r_x2": 74.45,
"r_y2": 668.07,
"r_x3": 50.11,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.34,
"r_y0": 676.75,
"r_x1": 82.65,
"r_y1": 676.75,
"r_x2": 82.65,
"r_y2": 667.91,
"r_x3": 78.34,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.53,
"r_y0": 676.97,
"r_x1": 123.63,
"r_y1": 676.97,
"r_x2": 123.63,
"r_y2": 668.07,
"r_x3": 86.53,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.52,
"r_y0": 676.75,
"r_x1": 132.5,
"r_y1": 676.75,
"r_x2": 132.5,
"r_y2": 667.35,
"r_x3": 127.52,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 676.97,
"r_x1": 210.7,
"r_y1": 676.97,
"r_x2": 210.7,
"r_y2": 668.07,
"r_x3": 132.5,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.75,
"r_x1": 215.68,
"r_y1": 676.75,
"r_x2": 215.68,
"r_y2": 667.35,
"r_x3": 210.7,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.56,
"r_y0": 676.97,
"r_x1": 233.95,
"r_y1": 676.97,
"r_x2": 233.95,
"r_y2": 668.07,
"r_x3": 219.56,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.83,
"r_y0": 676.75,
"r_x1": 247.09,
"r_y1": 676.75,
"r_x2": 247.09,
"r_y2": 667.91,
"r_x3": 237.83,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.47,
"r_y0": 676.97,
"r_x1": 286.36,
"r_y1": 676.97,
"r_x2": 286.36,
"r_y2": 668.07,
"r_x3": 251.47,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 688.93,
"r_x1": 205.89,
"r_y1": 688.93,
"r_x2": 205.89,
"r_y2": 680.02,
"r_x3": 50.11,
"r_y3": 680.02,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.36,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 701.2,
"r_x1": 69.54,
"r_y1": 701.2,
"r_x2": 69.54,
"r_y2": 692.29,
"r_x3": 62.07,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.27,
"r_y0": 701.2,
"r_x1": 286.36,
"r_y1": 701.2,
"r_x2": 286.36,
"r_y2": 692.29,
"r_x3": 76.27,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 94.6,
"r_y1": 713.15,
"r_x2": 94.6,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.93,
"r_x1": 103.29,
"r_y1": 712.93,
"r_x2": 103.29,
"r_y2": 704.09,
"r_x3": 97.6,
"r_y3": 704.09,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.29,
"r_y0": 713.15,
"r_x1": 286.36,
"r_y1": 713.15,
"r_x2": 286.36,
"r_y2": 704.25,
"r_x3": 103.29,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 308.86,
"t": 210.93,
"r": 545.12,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.894,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 219.84,
"r_x1": 545.12,
"r_y1": 219.84,
"r_x2": 545.12,
"r_y2": 210.93,
"r_x3": 308.86,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 231.79,
"r_x1": 545.12,
"r_y1": 231.79,
"r_x2": 545.12,
"r_y2": 222.89,
"r_x3": 308.86,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 243.75,
"r_x1": 545.12,
"r_y1": 243.75,
"r_x2": 545.12,
"r_y2": 234.84,
"r_x3": 308.86,
"r_y3": 234.84,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 255.7,
"r_x1": 339.58,
"r_y1": 255.7,
"r_x2": 339.58,
"r_y2": 246.8,
"r_x3": 308.86,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 259.1,
"r": 545.11,
"b": 279.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 268.01,
"r_x1": 328.29,
"r_y1": 268.01,
"r_x2": 328.29,
"r_y2": 259.1,
"r_x3": 320.82,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.88,
"r_y0": 268.01,
"r_x1": 545.11,
"r_y1": 268.01,
"r_x2": 545.11,
"r_y2": 259.1,
"r_x3": 334.88,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 279.96,
"r_x1": 338.19,
"r_y1": 279.96,
"r_x2": 338.19,
"r_y2": 271.06,
"r_x3": 308.86,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.68,
"r_y0": 279.74,
"r_x1": 346.38,
"r_y1": 279.74,
"r_x2": 346.38,
"r_y2": 270.9,
"r_x3": 340.68,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.38,
"r_y0": 279.96,
"r_x1": 453.72,
"r_y1": 279.96,
"r_x2": 453.72,
"r_y2": 271.06,
"r_x3": 346.38,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 283.36,
"r": 545.12,
"b": 387.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 292.27,
"r_x1": 328.39,
"r_y1": 292.27,
"r_x2": 328.39,
"r_y2": 283.36,
"r_x3": 320.82,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.91,
"r_y0": 292.27,
"r_x1": 545.11,
"r_y1": 292.27,
"r_x2": 545.11,
"r_y2": 283.36,
"r_x3": 330.91,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.22,
"r_x1": 545.12,
"r_y1": 304.22,
"r_x2": 545.12,
"r_y2": 295.32,
"r_x3": 308.86,
"r_y3": 295.32,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.18,
"r_x1": 545.12,
"r_y1": 316.18,
"r_x2": 545.12,
"r_y2": 307.27,
"r_x3": 308.86,
"r_y3": 307.27,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.13,
"r_x1": 545.12,
"r_y1": 328.13,
"r_x2": 545.12,
"r_y2": 319.23,
"r_x3": 308.86,
"r_y3": 319.23,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 340.09,
"r_x1": 397.19,
"r_y1": 340.09,
"r_x2": 397.19,
"r_y2": 331.18,
"r_x3": 308.86,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.66,
"r_y0": 340.09,
"r_x1": 545.12,
"r_y1": 340.09,
"r_x2": 545.12,
"r_y2": 331.18,
"r_x3": 403.66,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.05,
"r_x1": 545.12,
"r_y1": 352.05,
"r_x2": 545.12,
"r_y2": 343.14,
"r_x3": 308.86,
"r_y3": 343.14,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.0,
"r_x1": 545.12,
"r_y1": 364.0,
"r_x2": 545.12,
"r_y2": 355.09,
"r_x3": 308.86,
"r_y3": 355.09,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 375.96,
"r_x1": 545.12,
"r_y1": 375.96,
"r_x2": 545.12,
"r_y2": 367.05,
"r_x3": 308.86,
"r_y3": 367.05,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 387.91,
"r_x1": 329.61,
"r_y1": 387.91,
"r_x2": 329.61,
"r_y2": 379.0,
"r_x3": 308.86,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 391.31,
"r": 545.12,
"b": 459.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 400.22,
"r_x1": 328.55,
"r_y1": 400.22,
"r_x2": 328.55,
"r_y2": 391.31,
"r_x3": 320.82,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.13,
"r_y0": 400.22,
"r_x1": 545.12,
"r_y1": 400.22,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 331.13,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.27,
"r_x3": 308.86,
"r_y3": 403.27,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.13,
"r_x1": 545.12,
"r_y1": 424.13,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.18,
"r_x3": 308.86,
"r_y3": 427.18,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.04,
"r_x1": 545.12,
"r_y1": 448.04,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 426.18,
"r_y1": 459.99,
"r_x2": 426.18,
"r_y2": 451.09,
"r_x3": 308.86,
"r_y3": 451.09,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 463.39,
"r": 545.12,
"b": 567.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 472.3,
"r_x1": 328.67,
"r_y1": 472.3,
"r_x2": 328.67,
"r_y2": 463.39,
"r_x3": 320.82,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.29,
"r_y0": 472.3,
"r_x1": 545.11,
"r_y1": 472.3,
"r_x2": 545.11,
"r_y2": 463.39,
"r_x3": 331.29,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.25,
"r_x1": 545.12,
"r_y1": 484.25,
"r_x2": 545.12,
"r_y2": 475.35,
"r_x3": 308.86,
"r_y3": 475.35,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.21,
"r_x1": 545.12,
"r_y1": 496.21,
"r_x2": 545.12,
"r_y2": 487.3,
"r_x3": 308.86,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.16,
"r_x1": 381.9,
"r_y1": 508.16,
"r_x2": 381.9,
"r_y2": 499.26,
"r_x3": 308.86,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.16,
"r_x1": 545.12,
"r_y1": 508.16,
"r_x2": 545.12,
"r_y2": 499.26,
"r_x3": 388.7,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.12,
"r_x1": 545.12,
"r_y1": 520.12,
"r_x2": 545.12,
"r_y2": 511.21,
"r_x3": 308.86,
"r_y3": 511.21,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 532.07,
"r_x1": 545.12,
"r_y1": 532.07,
"r_x2": 545.12,
"r_y2": 523.17,
"r_x3": 308.86,
"r_y3": 523.17,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 544.03,
"r_x1": 545.11,
"r_y1": 544.03,
"r_x2": 545.11,
"r_y2": 535.12,
"r_x3": 308.86,
"r_y3": 535.12,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.98,
"r_x1": 545.12,
"r_y1": 555.98,
"r_x2": 545.12,
"r_y2": 547.08,
"r_x3": 308.86,
"r_y3": 547.08,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.94,
"r_x1": 442.22,
"r_y1": 567.94,
"r_x2": 442.22,
"r_y2": 559.03,
"r_x3": 308.86,
"r_y3": 559.03,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 308.86,
"t": 571.34,
"r": 545.12,
"b": 604.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.846,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 580.24,
"r_x1": 545.11,
"r_y1": 580.24,
"r_x2": 545.11,
"r_y2": 571.34,
"r_x3": 320.82,
"r_y3": 571.34,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 592.2,
"r_x1": 471.64,
"r_y1": 592.2,
"r_x2": 471.64,
"r_y2": 583.29,
"r_x3": 308.86,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.83,
"r_y0": 591.98,
"r_x1": 479.72,
"r_y1": 591.98,
"r_x2": 479.72,
"r_y2": 583.13,
"r_x3": 474.83,
"r_y3": 583.13,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.27,
"r_y0": 592.2,
"r_x1": 545.12,
"r_y1": 592.2,
"r_x2": 545.12,
"r_y2": 583.29,
"r_x3": 483.27,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 604.15,
"r_x1": 329.91,
"r_y1": 604.15,
"r_x2": 329.91,
"r_y2": 595.25,
"r_x3": 308.86,
"r_y3": 595.25,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 607.55,
"r": 545.12,
"b": 628.42,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 616.46,
"r_x1": 332.87,
"r_y1": 616.46,
"r_x2": 332.87,
"r_y2": 607.55,
"r_x3": 320.82,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.93,
"r_y0": 616.46,
"r_x1": 545.12,
"r_y1": 616.46,
"r_x2": 545.12,
"r_y2": 607.55,
"r_x3": 339.93,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 628.42,
"r_x1": 495.29,
"r_y1": 628.42,
"r_x2": 495.29,
"r_y2": 619.51,
"r_x3": 308.86,
"r_y3": 619.51,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 631.81,
"r": 545.12,
"b": 664.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 640.72,
"r_x1": 545.12,
"r_y1": 640.72,
"r_x2": 545.12,
"r_y2": 631.81,
"r_x3": 320.82,
"r_y3": 631.81,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 652.68,
"r_x1": 455.28,
"r_y1": 652.68,
"r_x2": 455.28,
"r_y2": 643.77,
"r_x3": 308.86,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.78,
"r_y0": 652.46,
"r_x1": 463.47,
"r_y1": 652.46,
"r_x2": 463.47,
"r_y2": 643.61,
"r_x3": 457.78,
"r_y3": 643.61,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.97,
"r_y0": 652.68,
"r_x1": 545.11,
"r_y1": 652.68,
"r_x2": 545.11,
"r_y2": 643.77,
"r_x3": 465.97,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 664.63,
"r_x1": 332.38,
"r_y1": 664.63,
"r_x2": 332.38,
"r_y2": 655.72,
"r_x3": 308.86,
"r_y3": 655.72,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 668.03,
"r": 545.11,
"b": 688.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 676.94,
"r_x1": 545.11,
"r_y1": 676.94,
"r_x2": 545.11,
"r_y2": 668.03,
"r_x3": 320.82,
"r_y3": 668.03,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 688.89,
"r_x1": 510.58,
"r_y1": 688.89,
"r_x2": 510.58,
"r_y2": 679.99,
"r_x3": 308.86,
"r_y3": 679.99,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 692.29,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.697,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 320.82,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "picture",
"id": 30,
"page_no": 11,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 53.54,
"t": 74.75,
"r": 544.94,
"b": 147.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.603,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.39,
"t": 77.31,
"r": 151.95,
"b": 83.26,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.35,
"t": 75.19,
"r": 59.33,
"b": 81.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.58,
"t": 77.46,
"r": 319.83,
"b": 83.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.37,
"t": 77.25,
"r": 481.76,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.55,
"t": 141.28,
"r": 94.98,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.04,
"t": 101.1,
"r": 85.29,
"b": 106.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.77,
"t": 124.4,
"r": 85.23,
"b": 129.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.55,
"t": 102.54,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 126.99,
"r": 249.66,
"b": 131.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.23,
"t": 114.05,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.38,
"t": 141.28,
"r": 105.08,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.94,
"t": 85.73,
"r": 76.15,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.22,
"r": 106.99,
"b": 91.18,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.21,
"t": 141.61,
"r": 281.88,
"b": 146.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.73,
"r": 241.91,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.94,
"t": 86.09,
"r": 282.49,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.19,
"t": 141.28,
"r": 444.69,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.37,
"t": 85.73,
"r": 432.67,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.61,
"t": 86.26,
"r": 445.62,
"b": 91.22,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.95,
"t": 141.29,
"r": 136.2,
"b": 146.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.92,
"t": 94.82,
"r": 127.05,
"b": 99.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.31,
"t": 100.94,
"r": 127.05,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.94,
"t": 107.06,
"r": 127.06,
"b": 112.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.23,
"t": 122.62,
"r": 126.97,
"b": 127.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.85,
"t": 128.74,
"r": 126.97,
"b": 133.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.58,
"t": 141.44,
"r": 156.04,
"b": 146.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.03,
"t": 86.27,
"r": 151.04,
"b": 91.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.65,
"t": 86.55,
"r": 321.67,
"b": 91.51,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.89,
"t": 141.71,
"r": 310.15,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.24,
"t": 93.08,
"r": 299.37,
"b": 98.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.64,
"t": 99.2,
"r": 299.37,
"b": 104.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.26,
"t": 105.32,
"r": 299.38,
"b": 110.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.43,
"t": 120.39,
"r": 299.17,
"b": 125.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.06,
"t": 126.51,
"r": 299.17,
"b": 131.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.35,
"t": 141.71,
"r": 328.81,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.58,
"t": 86.69,
"r": 309.6,
"b": 91.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.04,
"t": 141.67,
"r": 483.5,
"b": 146.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.02,
"t": 93.76,
"r": 469.16,
"b": 98.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.42,
"t": 99.88,
"r": 469.16,
"b": 104.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.05,
"t": 106.0,
"r": 469.16,
"b": 110.96,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.39,
"t": 85.57,
"r": 480.65,
"b": 90.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.38,
"t": 141.58,
"r": 182.63,
"b": 146.54,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.74,
"t": 94.86,
"r": 173.33,
"b": 99.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.51,
"t": 100.98,
"r": 173.32,
"b": 105.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.27,
"t": 107.1,
"r": 173.33,
"b": 112.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.41,
"t": 107.23,
"r": 346.0,
"b": 112.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.18,
"t": 113.35,
"r": 345.99,
"b": 118.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.94,
"t": 119.47,
"r": 346.0,
"b": 124.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 488.99,
"t": 104.15,
"r": 508.76,
"b": 109.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.19,
"t": 110.27,
"r": 508.76,
"b": 115.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.72,
"t": 116.39,
"r": 508.77,
"b": 121.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.71,
"t": 122.51,
"r": 508.77,
"b": 127.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.38,
"t": 141.71,
"r": 202.84,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.14,
"r": 197.53,
"b": 91.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.38,
"t": 86.0,
"r": 367.4,
"b": 90.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.73,
"t": 141.62,
"r": 374.93,
"b": 146.58,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.69,
"t": 86.06,
"r": 355.71,
"b": 91.01,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.54,
"t": 141.38,
"r": 526.01,
"b": 146.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.45,
"t": 86.09,
"r": 523.71,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 1,
"page_no": 11,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 165.5,
"r": 545.11,
"b": 186.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 174.41,
"r_x1": 545.11,
"r_y1": 174.41,
"r_x2": 545.11,
"r_y2": 165.5,
"r_x3": 50.11,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 186.36,
"r_x1": 513.52,
"r_y1": 186.36,
"r_x2": 513.52,
"r_y2": 177.46,
"r_x3": 50.11,
"r_y3": 177.46,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."
},
{
"label": "list_item",
"id": 4,
"page_no": 11,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 210.93,
"r": 286.37,
"b": 231.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 219.84,
"r_x1": 71.15,
"r_y1": 219.84,
"r_x2": 71.15,
"r_y2": 210.93,
"r_x3": 61.57,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.54,
"r_y0": 219.84,
"r_x1": 286.37,
"r_y1": 219.84,
"r_x2": 286.37,
"r_y2": 210.93,
"r_x3": 73.54,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 231.79,
"r_x1": 87.47,
"r_y1": 231.79,
"r_x2": 87.47,
"r_y2": 222.89,
"r_x3": 70.04,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 TableFormer output does not include the table cell content."
},
{
"label": "list_item",
"id": 3,
"page_no": 11,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 244.07,
"r": 286.37,
"b": 264.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.963,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 252.98,
"r_x1": 71.35,
"r_y1": 252.98,
"r_x2": 71.35,
"r_y2": 244.07,
"r_x3": 61.57,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.79,
"r_y0": 252.98,
"r_x1": 286.37,
"r_y1": 252.98,
"r_x2": 286.37,
"r_y2": 244.07,
"r_x3": 73.79,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 264.93,
"r_x1": 150.42,
"r_y1": 264.93,
"r_x2": 150.42,
"r_y2": 256.03,
"r_x3": 70.04,
"r_y3": 256.03,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."
},
{
"label": "text",
"id": 0,
"page_no": 11,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 279.2,
"r": 286.37,
"b": 395.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 288.11,
"r_x1": 286.36,
"r_y1": 288.11,
"r_x2": 286.36,
"r_y2": 279.2,
"r_x3": 62.07,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.06,
"r_x1": 286.37,
"r_y1": 300.06,
"r_x2": 286.37,
"r_y2": 291.16,
"r_x3": 50.11,
"r_y3": 291.16,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.02,
"r_x1": 286.37,
"r_y1": 312.02,
"r_x2": 286.37,
"r_y2": 303.11,
"r_x3": 50.11,
"r_y3": 303.11,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.97,
"r_x1": 286.37,
"r_y1": 323.97,
"r_x2": 286.37,
"r_y2": 315.07,
"r_x3": 50.11,
"r_y3": 315.07,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.93,
"r_x1": 286.37,
"r_y1": 335.93,
"r_x2": 286.37,
"r_y2": 327.02,
"r_x3": 50.11,
"r_y3": 327.02,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.89,
"r_x1": 286.37,
"r_y1": 347.89,
"r_x2": 286.37,
"r_y2": 338.98,
"r_x3": 50.11,
"r_y3": 338.98,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.84,
"r_x1": 286.37,
"r_y1": 359.84,
"r_x2": 286.37,
"r_y2": 350.93,
"r_x3": 50.11,
"r_y3": 350.93,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.8,
"r_x1": 286.37,
"r_y1": 371.8,
"r_x2": 286.37,
"r_y2": 362.89,
"r_x3": 50.11,
"r_y3": 362.89,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.75,
"r_x1": 286.37,
"r_y1": 383.75,
"r_x2": 286.37,
"r_y2": 374.84,
"r_x3": 50.11,
"r_y3": 374.84,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.71,
"r_x1": 154.56,
"r_y1": 395.71,
"r_x2": 154.56,
"r_y2": 386.8,
"r_x3": 50.11,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."
},
{
"label": "text",
"id": 11,
"page_no": 11,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 399.07,
"r": 286.36,
"b": 419.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.935,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 407.98,
"r_x1": 286.36,
"r_y1": 407.98,
"r_x2": 286.36,
"r_y2": 399.07,
"r_x3": 62.07,
"r_y3": 399.07,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 419.93,
"r_x1": 95.49,
"r_y1": 419.93,
"r_x2": 95.49,
"r_y2": 411.03,
"r_x3": 50.11,
"r_y3": 411.03,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Here is a step-by-step description of the prediction postprocessing:"
},
{
"label": "list_item",
"id": 20,
"page_no": 11,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 423.3,
"r": 286.37,
"b": 456.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.828,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 432.2,
"r_x1": 69.37,
"r_y1": 432.2,
"r_x2": 69.37,
"r_y2": 423.3,
"r_x3": 62.07,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.81,
"r_y0": 432.2,
"r_x1": 286.37,
"r_y1": 432.2,
"r_x2": 286.37,
"r_y2": 423.3,
"r_x3": 71.81,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.16,
"r_x1": 286.37,
"r_y1": 444.16,
"r_x2": 286.37,
"r_y2": 435.25,
"r_x3": 50.11,
"r_y3": 435.25,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 456.11,
"r_x1": 274.51,
"r_y1": 456.11,
"r_x2": 274.51,
"r_y2": 447.21,
"r_x3": 50.11,
"r_y3": 447.21,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."
},
{
"label": "list_item",
"id": 2,
"page_no": 11,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 459.48,
"r": 286.37,
"b": 504.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 468.38,
"r_x1": 69.54,
"r_y1": 468.38,
"r_x2": 69.54,
"r_y2": 459.48,
"r_x3": 62.07,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.43,
"r_y0": 468.38,
"r_x1": 286.36,
"r_y1": 468.38,
"r_x2": 286.36,
"r_y2": 459.48,
"r_x3": 77.43,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 480.34,
"r_x1": 286.37,
"r_y1": 480.34,
"r_x2": 286.37,
"r_y2": 471.43,
"r_x3": 50.11,
"r_y3": 471.43,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.29,
"r_x1": 286.37,
"r_y1": 492.29,
"r_x2": 286.37,
"r_y2": 483.39,
"r_x3": 50.11,
"r_y3": 483.39,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 504.25,
"r_x1": 110.7,
"r_y1": 504.25,
"r_x2": 110.7,
"r_y2": 495.34,
"r_x3": 50.11,
"r_y3": 495.34,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."
},
{
"label": "list_item",
"id": 10,
"page_no": 11,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 507.61,
"r": 286.36,
"b": 528.47,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 516.52,
"r_x1": 69.86,
"r_y1": 516.52,
"r_x2": 69.86,
"r_y2": 507.61,
"r_x3": 62.07,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.46,
"r_y0": 516.52,
"r_x1": 286.36,
"r_y1": 516.52,
"r_x2": 286.36,
"r_y2": 507.61,
"r_x3": 72.46,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 528.47,
"r_x1": 226.07,
"r_y1": 528.47,
"r_x2": 226.07,
"r_y2": 519.57,
"r_x3": 50.11,
"r_y3": 519.57,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones."
},
{
"label": "list_item",
"id": 8,
"page_no": 11,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 531.84,
"r": 286.37,
"b": 564.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.949,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 540.74,
"r_x1": 286.36,
"r_y1": 540.74,
"r_x2": 286.36,
"r_y2": 531.84,
"r_x3": 62.07,
"r_y3": 531.84,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 552.7,
"r_x1": 286.37,
"r_y1": 552.7,
"r_x2": 286.37,
"r_y2": 543.79,
"r_x3": 50.11,
"r_y3": 543.79,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 564.65,
"r_x1": 114.03,
"r_y1": 564.65,
"r_x2": 114.03,
"r_y2": 555.75,
"r_x3": 50.11,
"r_y3": 555.75,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."
},
{
"label": "list_item",
"id": 5,
"page_no": 11,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 568.02,
"r": 286.37,
"b": 600.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 576.92,
"r_x1": 69.54,
"r_y1": 576.92,
"r_x2": 69.54,
"r_y2": 568.02,
"r_x3": 62.07,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.73,
"r_y0": 576.92,
"r_x1": 286.37,
"r_y1": 576.92,
"r_x2": 286.37,
"r_y2": 568.02,
"r_x3": 76.73,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 588.88,
"r_x1": 286.37,
"r_y1": 588.88,
"r_x2": 286.37,
"r_y2": 579.97,
"r_x3": 50.11,
"r_y3": 579.97,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 600.83,
"r_x1": 278.7,
"r_y1": 600.83,
"r_x2": 278.7,
"r_y2": 591.93,
"r_x3": 50.11,
"r_y3": 591.93,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"
},
{
"label": "formula",
"id": 12,
"page_no": 11,
"cluster": {
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.44,
"r": 286.36,
"b": 654.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.03,
"r_y0": 632.84,
"r_x1": 157.95,
"r_y1": 632.84,
"r_x2": 157.95,
"r_y2": 623.99,
"r_x3": 112.03,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.72,
"r_y0": 632.84,
"r_x1": 203.5,
"r_y1": 632.84,
"r_x2": 203.5,
"r_y2": 623.99,
"r_x3": 160.72,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 640.18,
"r_x1": 189.15,
"r_y1": 640.18,
"r_x2": 189.15,
"r_y2": 633.98,
"r_x3": 185.58,
"r_y3": 633.98,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.84,
"r_x1": 208.48,
"r_y1": 632.84,
"r_x2": 208.48,
"r_y2": 623.44,
"r_x3": 203.5,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.48,
"r_y0": 632.84,
"r_x1": 220.29,
"r_y1": 632.84,
"r_x2": 220.29,
"r_y2": 623.99,
"r_x3": 208.48,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 632.84,
"r_x1": 225.77,
"r_y1": 632.84,
"r_x2": 225.77,
"r_y2": 623.44,
"r_x3": 220.79,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.11,
"r_x1": 122.51,
"r_y1": 654.11,
"r_x2": 122.51,
"r_y2": 645.26,
"r_x3": 110.7,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.78,
"r_y0": 654.11,
"r_x1": 133.53,
"r_y1": 654.11,
"r_x2": 133.53,
"r_y2": 645.26,
"r_x3": 125.78,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.29,
"r_y0": 654.11,
"r_x1": 156.0,
"r_y1": 654.11,
"r_x2": 156.0,
"r_y2": 645.26,
"r_x3": 136.29,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.11,
"r_x1": 160.98,
"r_y1": 654.11,
"r_x2": 160.98,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.98,
"r_y0": 654.11,
"r_x1": 170.24,
"r_y1": 654.11,
"r_x2": 170.24,
"r_y2": 645.26,
"r_x3": 160.98,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.74,
"r_y0": 654.11,
"r_x1": 185.68,
"r_y1": 654.11,
"r_x2": 185.68,
"r_y2": 644.7,
"r_x3": 170.74,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.89,
"r_y0": 654.11,
"r_x1": 206.05,
"r_y1": 654.11,
"r_x2": 206.05,
"r_y2": 645.26,
"r_x3": 187.89,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.05,
"r_y0": 654.11,
"r_x1": 211.04,
"r_y1": 654.11,
"r_x2": 211.04,
"r_y2": 644.7,
"r_x3": 206.05,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.03,
"r_y0": 654.11,
"r_x1": 220.29,
"r_y1": 654.11,
"r_x2": 220.29,
"r_y2": 645.26,
"r_x3": 211.03,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 654.11,
"r_x1": 225.77,
"r_y1": 654.11,
"r_x2": 225.77,
"r_y2": 644.7,
"r_x3": 220.79,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 643.79,
"r_x1": 286.36,
"r_y1": 643.79,
"r_x2": 286.36,
"r_y2": 634.89,
"r_x3": 274.75,
"r_y3": 634.89,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)"
},
{
"label": "text",
"id": 7,
"page_no": 11,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 667.35,
"r": 286.36,
"b": 688.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 676.97,
"r_x1": 74.45,
"r_y1": 676.97,
"r_x2": 74.45,
"r_y2": 668.07,
"r_x3": 50.11,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.34,
"r_y0": 676.75,
"r_x1": 82.65,
"r_y1": 676.75,
"r_x2": 82.65,
"r_y2": 667.91,
"r_x3": 78.34,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.53,
"r_y0": 676.97,
"r_x1": 123.63,
"r_y1": 676.97,
"r_x2": 123.63,
"r_y2": 668.07,
"r_x3": 86.53,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.52,
"r_y0": 676.75,
"r_x1": 132.5,
"r_y1": 676.75,
"r_x2": 132.5,
"r_y2": 667.35,
"r_x3": 127.52,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 676.97,
"r_x1": 210.7,
"r_y1": 676.97,
"r_x2": 210.7,
"r_y2": 668.07,
"r_x3": 132.5,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.75,
"r_x1": 215.68,
"r_y1": 676.75,
"r_x2": 215.68,
"r_y2": 667.35,
"r_x3": 210.7,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.56,
"r_y0": 676.97,
"r_x1": 233.95,
"r_y1": 676.97,
"r_x2": 233.95,
"r_y2": 668.07,
"r_x3": 219.56,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.83,
"r_y0": 676.75,
"r_x1": 247.09,
"r_y1": 676.75,
"r_x2": 247.09,
"r_y2": 667.91,
"r_x3": 237.83,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.47,
"r_y0": 676.97,
"r_x1": 286.36,
"r_y1": 676.97,
"r_x2": 286.36,
"r_y2": 668.07,
"r_x3": 251.47,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 688.93,
"r_x1": 205.89,
"r_y1": 688.93,
"r_x2": 205.89,
"r_y2": 680.02,
"r_x3": 50.11,
"r_y3": 680.02,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point."
},
{
"label": "list_item",
"id": 13,
"page_no": 11,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.36,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 701.2,
"r_x1": 69.54,
"r_y1": 701.2,
"r_x2": 69.54,
"r_y2": 692.29,
"r_x3": 62.07,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.27,
"r_y0": 701.2,
"r_x1": 286.36,
"r_y1": 701.2,
"r_x2": 286.36,
"r_y2": 692.29,
"r_x3": 76.27,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 94.6,
"r_y1": 713.15,
"r_x2": 94.6,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.93,
"r_x1": 103.29,
"r_y1": 712.93,
"r_x2": 103.29,
"r_y2": 704.09,
"r_x3": 97.6,
"r_y3": 704.09,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.29,
"r_y0": 713.15,
"r_x1": 286.36,
"r_y1": 713.15,
"r_x2": 286.36,
"r_y2": 704.25,
"r_x3": 103.29,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-"
},
{
"label": "text",
"id": 16,
"page_no": 11,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 308.86,
"t": 210.93,
"r": 545.12,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.894,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 219.84,
"r_x1": 545.12,
"r_y1": 219.84,
"r_x2": 545.12,
"r_y2": 210.93,
"r_x3": 308.86,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 231.79,
"r_x1": 545.12,
"r_y1": 231.79,
"r_x2": 545.12,
"r_y2": 222.89,
"r_x3": 308.86,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 243.75,
"r_x1": 545.12,
"r_y1": 243.75,
"r_x2": 545.12,
"r_y2": 234.84,
"r_x3": 308.86,
"r_y3": 234.84,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 255.7,
"r_x1": 339.58,
"r_y1": 255.7,
"r_x2": 339.58,
"r_y2": 246.8,
"r_x3": 308.86,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."
},
{
"label": "list_item",
"id": 9,
"page_no": 11,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 259.1,
"r": 545.11,
"b": 279.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 268.01,
"r_x1": 328.29,
"r_y1": 268.01,
"r_x2": 328.29,
"r_y2": 259.1,
"r_x3": 320.82,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.88,
"r_y0": 268.01,
"r_x1": 545.11,
"r_y1": 268.01,
"r_x2": 545.11,
"r_y2": 259.1,
"r_x3": 334.88,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 279.96,
"r_x1": 338.19,
"r_y1": 279.96,
"r_x2": 338.19,
"r_y2": 271.06,
"r_x3": 308.86,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.68,
"r_y0": 279.74,
"r_x1": 346.38,
"r_y1": 279.74,
"r_x2": 346.38,
"r_y2": 270.9,
"r_x3": 340.68,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.38,
"r_y0": 279.96,
"r_x1": 453.72,
"r_y1": 279.96,
"r_x2": 453.72,
"r_y2": 271.06,
"r_x3": 346.38,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes."
},
{
"label": "list_item",
"id": 6,
"page_no": 11,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 283.36,
"r": 545.12,
"b": 387.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 292.27,
"r_x1": 328.39,
"r_y1": 292.27,
"r_x2": 328.39,
"r_y2": 283.36,
"r_x3": 320.82,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.91,
"r_y0": 292.27,
"r_x1": 545.11,
"r_y1": 292.27,
"r_x2": 545.11,
"r_y2": 283.36,
"r_x3": 330.91,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.22,
"r_x1": 545.12,
"r_y1": 304.22,
"r_x2": 545.12,
"r_y2": 295.32,
"r_x3": 308.86,
"r_y3": 295.32,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.18,
"r_x1": 545.12,
"r_y1": 316.18,
"r_x2": 545.12,
"r_y2": 307.27,
"r_x3": 308.86,
"r_y3": 307.27,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.13,
"r_x1": 545.12,
"r_y1": 328.13,
"r_x2": 545.12,
"r_y2": 319.23,
"r_x3": 308.86,
"r_y3": 319.23,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 340.09,
"r_x1": 397.19,
"r_y1": 340.09,
"r_x2": 397.19,
"r_y2": 331.18,
"r_x3": 308.86,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.66,
"r_y0": 340.09,
"r_x1": 545.12,
"r_y1": 340.09,
"r_x2": 545.12,
"r_y2": 331.18,
"r_x3": 403.66,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.05,
"r_x1": 545.12,
"r_y1": 352.05,
"r_x2": 545.12,
"r_y2": 343.14,
"r_x3": 308.86,
"r_y3": 343.14,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.0,
"r_x1": 545.12,
"r_y1": 364.0,
"r_x2": 545.12,
"r_y2": 355.09,
"r_x3": 308.86,
"r_y3": 355.09,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 375.96,
"r_x1": 545.12,
"r_y1": 375.96,
"r_x2": 545.12,
"r_y2": 367.05,
"r_x3": 308.86,
"r_y3": 367.05,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 387.91,
"r_x1": 329.61,
"r_y1": 387.91,
"r_x2": 329.61,
"r_y2": 379.0,
"r_x3": 308.86,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."
},
{
"label": "list_item",
"id": 17,
"page_no": 11,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 391.31,
"r": 545.12,
"b": 459.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 400.22,
"r_x1": 328.55,
"r_y1": 400.22,
"r_x2": 328.55,
"r_y2": 391.31,
"r_x3": 320.82,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.13,
"r_y0": 400.22,
"r_x1": 545.12,
"r_y1": 400.22,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 331.13,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.27,
"r_x3": 308.86,
"r_y3": 403.27,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.13,
"r_x1": 545.12,
"r_y1": 424.13,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.18,
"r_x3": 308.86,
"r_y3": 427.18,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.04,
"r_x1": 545.12,
"r_y1": 448.04,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 426.18,
"r_y1": 459.99,
"r_x2": 426.18,
"r_y2": 451.09,
"r_x3": 308.86,
"r_y3": 451.09,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."
},
{
"label": "list_item",
"id": 15,
"page_no": 11,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 463.39,
"r": 545.12,
"b": 567.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 472.3,
"r_x1": 328.67,
"r_y1": 472.3,
"r_x2": 328.67,
"r_y2": 463.39,
"r_x3": 320.82,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.29,
"r_y0": 472.3,
"r_x1": 545.11,
"r_y1": 472.3,
"r_x2": 545.11,
"r_y2": 463.39,
"r_x3": 331.29,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.25,
"r_x1": 545.12,
"r_y1": 484.25,
"r_x2": 545.12,
"r_y2": 475.35,
"r_x3": 308.86,
"r_y3": 475.35,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.21,
"r_x1": 545.12,
"r_y1": 496.21,
"r_x2": 545.12,
"r_y2": 487.3,
"r_x3": 308.86,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.16,
"r_x1": 381.9,
"r_y1": 508.16,
"r_x2": 381.9,
"r_y2": 499.26,
"r_x3": 308.86,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.16,
"r_x1": 545.12,
"r_y1": 508.16,
"r_x2": 545.12,
"r_y2": 499.26,
"r_x3": 388.7,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.12,
"r_x1": 545.12,
"r_y1": 520.12,
"r_x2": 545.12,
"r_y2": 511.21,
"r_x3": 308.86,
"r_y3": 511.21,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 532.07,
"r_x1": 545.12,
"r_y1": 532.07,
"r_x2": 545.12,
"r_y2": 523.17,
"r_x3": 308.86,
"r_y3": 523.17,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 544.03,
"r_x1": 545.11,
"r_y1": 544.03,
"r_x2": 545.11,
"r_y2": 535.12,
"r_x3": 308.86,
"r_y3": 535.12,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.98,
"r_x1": 545.12,
"r_y1": 555.98,
"r_x2": 545.12,
"r_y2": 547.08,
"r_x3": 308.86,
"r_y3": 547.08,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.94,
"r_x1": 442.22,
"r_y1": 567.94,
"r_x2": 442.22,
"r_y2": 559.03,
"r_x3": 308.86,
"r_y3": 559.03,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."
},
{
"label": "text",
"id": 19,
"page_no": 11,
"cluster": {
"id": 19,
"label": "text",
"bbox": {
"l": 308.86,
"t": 571.34,
"r": 545.12,
"b": 604.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.846,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 580.24,
"r_x1": 545.11,
"r_y1": 580.24,
"r_x2": 545.11,
"r_y2": 571.34,
"r_x3": 320.82,
"r_y3": 571.34,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 592.2,
"r_x1": 471.64,
"r_y1": 592.2,
"r_x2": 471.64,
"r_y2": 583.29,
"r_x3": 308.86,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.83,
"r_y0": 591.98,
"r_x1": 479.72,
"r_y1": 591.98,
"r_x2": 479.72,
"r_y2": 583.13,
"r_x3": 474.83,
"r_y3": 583.13,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.27,
"r_y0": 592.2,
"r_x1": 545.12,
"r_y1": 592.2,
"r_x2": 545.12,
"r_y2": 583.29,
"r_x3": 483.27,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 604.15,
"r_x1": 329.91,
"r_y1": 604.15,
"r_x2": 329.91,
"r_y2": 595.25,
"r_x3": 308.86,
"r_y3": 595.25,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."
},
{
"label": "list_item",
"id": 21,
"page_no": 11,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 607.55,
"r": 545.12,
"b": 628.42,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 616.46,
"r_x1": 332.87,
"r_y1": 616.46,
"r_x2": 332.87,
"r_y2": 607.55,
"r_x3": 320.82,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.93,
"r_y0": 616.46,
"r_x1": 545.12,
"r_y1": 616.46,
"r_x2": 545.12,
"r_y2": 607.55,
"r_x3": 339.93,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 628.42,
"r_x1": 495.29,
"r_y1": 628.42,
"r_x2": 495.29,
"r_y2": 619.51,
"r_x3": 308.86,
"r_y3": 619.51,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."
},
{
"label": "list_item",
"id": 18,
"page_no": 11,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 631.81,
"r": 545.12,
"b": 664.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 640.72,
"r_x1": 545.12,
"r_y1": 640.72,
"r_x2": 545.12,
"r_y2": 631.81,
"r_x3": 320.82,
"r_y3": 631.81,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 652.68,
"r_x1": 455.28,
"r_y1": 652.68,
"r_x2": 455.28,
"r_y2": 643.77,
"r_x3": 308.86,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.78,
"r_y0": 652.46,
"r_x1": 463.47,
"r_y1": 652.46,
"r_x2": 463.47,
"r_y2": 643.61,
"r_x3": 457.78,
"r_y3": 643.61,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.97,
"r_y0": 652.68,
"r_x1": 545.11,
"r_y1": 652.68,
"r_x2": 545.11,
"r_y2": 643.77,
"r_x3": 465.97,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 664.63,
"r_x1": 332.38,
"r_y1": 664.63,
"r_x2": 332.38,
"r_y2": 655.72,
"r_x3": 308.86,
"r_y3": 655.72,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."
},
{
"label": "list_item",
"id": 22,
"page_no": 11,
"cluster": {
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 668.03,
"r": 545.11,
"b": 688.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 676.94,
"r_x1": 545.11,
"r_y1": 676.94,
"r_x2": 545.11,
"r_y2": 668.03,
"r_x3": 320.82,
"r_y3": 668.03,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 688.89,
"r_x1": 510.58,
"r_y1": 688.89,
"r_x2": 510.58,
"r_y2": 679.99,
"r_x3": 308.86,
"r_y3": 679.99,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."
},
{
"label": "list_item",
"id": 25,
"page_no": 11,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 692.29,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.697,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 320.82,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"
},
{
"label": "page_footer",
"id": 14,
"page_no": 11,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "12"
}
],
"body": [
{
"label": "picture",
"id": 30,
"page_no": 11,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 53.54,
"t": 74.75,
"r": 544.94,
"b": 147.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.603,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.39,
"t": 77.31,
"r": 151.95,
"b": 83.26,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.39,
"r_y0": 83.26,
"r_x1": 151.95,
"r_y1": 83.26,
"r_x2": 151.95,
"r_y2": 77.31,
"r_x3": 119.39,
"r_y3": 77.31,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.35,
"t": 75.19,
"r": 59.33,
"b": 81.14,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.35,
"r_y0": 81.14,
"r_x1": 59.33,
"r_y1": 81.14,
"r_x2": 59.33,
"r_y2": 75.19,
"r_x3": 53.35,
"r_y3": 75.19,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.58,
"t": 77.46,
"r": 319.83,
"b": 83.41,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.58,
"r_y0": 83.41,
"r_x1": 319.83,
"r_y1": 83.41,
"r_x2": 319.83,
"r_y2": 77.46,
"r_x3": 289.58,
"r_y3": 77.46,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.37,
"t": 77.25,
"r": 481.76,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.37,
"r_y0": 83.2,
"r_x1": 481.76,
"r_y1": 83.2,
"r_x2": 481.76,
"r_y2": 77.25,
"r_x3": 448.37,
"r_y3": 77.25,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.55,
"t": 141.28,
"r": 94.98,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.55,
"r_y0": 146.23,
"r_x1": 94.98,
"r_y1": 146.23,
"r_x2": 94.98,
"r_y2": 141.28,
"r_x3": 82.55,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.04,
"t": 101.1,
"r": 85.29,
"b": 106.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.04,
"r_y0": 106.06,
"r_x1": 85.29,
"r_y1": 106.06,
"r_x2": 85.29,
"r_y2": 101.1,
"r_x3": 63.04,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.77,
"t": 124.4,
"r": 85.23,
"b": 129.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.77,
"r_y0": 129.35,
"r_x1": 85.23,
"r_y1": 129.35,
"r_x2": 85.23,
"r_y2": 124.4,
"r_x3": 67.77,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.55,
"t": 102.54,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.55,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.54,
"r_x3": 227.55,
"r_y3": 102.54,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 126.99,
"r": 249.66,
"b": 131.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.94,
"r_x1": 249.66,
"r_y1": 131.94,
"r_x2": 249.66,
"r_y2": 126.99,
"r_x3": 232.2,
"r_y3": 126.99,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.23,
"t": 114.05,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.23,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.05,
"r_x3": 396.23,
"r_y3": 114.05,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.38,
"t": 141.28,
"r": 105.08,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.38,
"r_y0": 146.23,
"r_x1": 105.08,
"r_y1": 146.23,
"r_x2": 105.08,
"r_y2": 141.28,
"r_x3": 97.38,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.94,
"t": 85.73,
"r": 76.15,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.94,
"r_y0": 90.69,
"r_x1": 76.15,
"r_y1": 90.69,
"r_x2": 76.15,
"r_y2": 85.73,
"r_x3": 60.94,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.22,
"r": 106.99,
"b": 91.18,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.18,
"r_x1": 106.99,
"r_y1": 91.18,
"r_x2": 106.99,
"r_y2": 86.22,
"r_x3": 82.3,
"r_y3": 86.22,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.21,
"t": 141.61,
"r": 281.88,
"b": 146.56,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.21,
"r_y0": 146.56,
"r_x1": 281.88,
"r_y1": 146.56,
"r_x2": 281.88,
"r_y2": 141.61,
"r_x3": 246.21,
"r_y3": 141.61,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.73,
"r": 241.91,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.69,
"r_x1": 241.91,
"r_y1": 90.69,
"r_x2": 241.91,
"r_y2": 85.73,
"r_x3": 226.7,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.94,
"t": 86.09,
"r": 282.49,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.94,
"r_y0": 91.05,
"r_x1": 282.49,
"r_y1": 91.05,
"r_x2": 282.49,
"r_y2": 86.09,
"r_x3": 249.94,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.19,
"t": 141.28,
"r": 444.69,
"b": 146.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.19,
"r_y0": 146.23,
"r_x1": 444.69,
"r_y1": 146.23,
"r_x2": 444.69,
"r_y2": 141.28,
"r_x3": 410.19,
"r_y3": 141.28,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.37,
"t": 85.73,
"r": 432.67,
"b": 90.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.37,
"r_y0": 90.69,
"r_x1": 432.67,
"r_y1": 90.69,
"r_x2": 432.67,
"r_y2": 85.73,
"r_x3": 391.37,
"r_y3": 85.73,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.61,
"t": 86.26,
"r": 445.62,
"b": 91.22,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.61,
"r_y0": 91.22,
"r_x1": 445.62,
"r_y1": 91.22,
"r_x2": 445.62,
"r_y2": 86.26,
"r_x3": 435.61,
"r_y3": 86.26,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.95,
"t": 141.29,
"r": 136.2,
"b": 146.25,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.95,
"r_y0": 146.25,
"r_x1": 136.2,
"r_y1": 146.25,
"r_x2": 136.2,
"r_y2": 141.29,
"r_x3": 113.95,
"r_y3": 141.29,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.92,
"t": 94.82,
"r": 127.05,
"b": 99.78,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.92,
"r_y0": 99.78,
"r_x1": 127.05,
"r_y1": 99.78,
"r_x2": 127.05,
"r_y2": 94.82,
"r_x3": 116.92,
"r_y3": 94.82,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.31,
"t": 100.94,
"r": 127.05,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.31,
"r_y0": 105.9,
"r_x1": 127.05,
"r_y1": 105.9,
"r_x2": 127.05,
"r_y2": 100.94,
"r_x3": 113.31,
"r_y3": 100.94,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.94,
"t": 107.06,
"r": 127.06,
"b": 112.02,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.94,
"r_y0": 112.02,
"r_x1": 127.06,
"r_y1": 112.02,
"r_x2": 127.06,
"r_y2": 107.06,
"r_x3": 112.94,
"r_y3": 107.06,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.23,
"t": 122.62,
"r": 126.97,
"b": 127.57,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.23,
"r_y0": 127.57,
"r_x1": 126.97,
"r_y1": 127.57,
"r_x2": 126.97,
"r_y2": 122.62,
"r_x3": 113.23,
"r_y3": 122.62,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.85,
"t": 128.74,
"r": 126.97,
"b": 133.69,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.85,
"r_y0": 133.69,
"r_x1": 126.97,
"r_y1": 133.69,
"r_x2": 126.97,
"r_y2": 128.74,
"r_x3": 112.85,
"r_y3": 128.74,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.58,
"t": 141.44,
"r": 156.04,
"b": 146.39,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.58,
"r_y0": 146.39,
"r_x1": 156.04,
"r_y1": 146.39,
"r_x2": 156.04,
"r_y2": 141.44,
"r_x3": 138.58,
"r_y3": 141.44,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.03,
"t": 86.27,
"r": 151.04,
"b": 91.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.03,
"r_y0": 91.23,
"r_x1": 151.04,
"r_y1": 91.23,
"r_x2": 151.04,
"r_y2": 86.27,
"r_x3": 122.03,
"r_y3": 86.27,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.65,
"t": 86.55,
"r": 321.67,
"b": 91.51,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.65,
"r_y0": 91.51,
"r_x1": 321.67,
"r_y1": 91.51,
"r_x2": 321.67,
"r_y2": 86.55,
"r_x3": 311.65,
"r_y3": 86.55,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.89,
"t": 141.71,
"r": 310.15,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.89,
"r_y0": 146.67,
"r_x1": 310.15,
"r_y1": 146.67,
"r_x2": 310.15,
"r_y2": 141.71,
"r_x3": 287.89,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.24,
"t": 93.08,
"r": 299.37,
"b": 98.04,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.24,
"r_y0": 98.04,
"r_x1": 299.37,
"r_y1": 98.04,
"r_x2": 299.37,
"r_y2": 93.08,
"r_x3": 289.24,
"r_y3": 93.08,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.64,
"t": 99.2,
"r": 299.37,
"b": 104.16,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.64,
"r_y0": 104.16,
"r_x1": 299.37,
"r_y1": 104.16,
"r_x2": 299.37,
"r_y2": 99.2,
"r_x3": 285.64,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.26,
"t": 105.32,
"r": 299.38,
"b": 110.28,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.26,
"r_y0": 110.28,
"r_x1": 299.38,
"r_y1": 110.28,
"r_x2": 299.38,
"r_y2": 105.32,
"r_x3": 285.26,
"r_y3": 105.32,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.43,
"t": 120.39,
"r": 299.17,
"b": 125.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.43,
"r_y0": 125.35,
"r_x1": 299.17,
"r_y1": 125.35,
"r_x2": 299.17,
"r_y2": 120.39,
"r_x3": 285.43,
"r_y3": 120.39,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.06,
"t": 126.51,
"r": 299.17,
"b": 131.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.06,
"r_y0": 131.47,
"r_x1": 299.17,
"r_y1": 131.47,
"r_x2": 299.17,
"r_y2": 126.51,
"r_x3": 285.06,
"r_y3": 126.51,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.35,
"t": 141.71,
"r": 328.81,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.35,
"r_y0": 146.67,
"r_x1": 328.81,
"r_y1": 146.67,
"r_x2": 328.81,
"r_y2": 141.71,
"r_x3": 311.35,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.58,
"t": 86.69,
"r": 309.6,
"b": 91.65,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.58,
"r_y0": 91.65,
"r_x1": 309.6,
"r_y1": 91.65,
"r_x2": 309.6,
"r_y2": 86.69,
"r_x3": 299.58,
"r_y3": 86.69,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.04,
"t": 141.67,
"r": 483.5,
"b": 146.63,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.04,
"r_y0": 146.63,
"r_x1": 483.5,
"r_y1": 146.63,
"r_x2": 483.5,
"r_y2": 141.67,
"r_x3": 466.04,
"r_y3": 141.67,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.02,
"t": 93.76,
"r": 469.16,
"b": 98.72,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.02,
"r_y0": 98.72,
"r_x1": 469.16,
"r_y1": 98.72,
"r_x2": 469.16,
"r_y2": 93.76,
"r_x3": 459.02,
"r_y3": 93.76,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.42,
"t": 99.88,
"r": 469.16,
"b": 104.84,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.42,
"r_y0": 104.84,
"r_x1": 469.16,
"r_y1": 104.84,
"r_x2": 469.16,
"r_y2": 99.88,
"r_x3": 455.42,
"r_y3": 99.88,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.05,
"t": 106.0,
"r": 469.16,
"b": 110.96,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.05,
"r_y0": 110.96,
"r_x1": 469.16,
"r_y1": 110.96,
"r_x2": 469.16,
"r_y2": 106.0,
"r_x3": 455.05,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.39,
"t": 85.57,
"r": 480.65,
"b": 90.53,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.39,
"r_y0": 90.53,
"r_x1": 480.65,
"r_y1": 90.53,
"r_x2": 480.65,
"r_y2": 85.57,
"r_x3": 467.39,
"r_y3": 85.57,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.38,
"t": 141.58,
"r": 182.63,
"b": 146.54,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.38,
"r_y0": 146.54,
"r_x1": 182.63,
"r_y1": 146.54,
"r_x2": 182.63,
"r_y2": 141.58,
"r_x3": 160.38,
"r_y3": 141.58,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.74,
"t": 94.86,
"r": 173.33,
"b": 99.82,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.74,
"r_y0": 99.82,
"r_x1": 173.33,
"r_y1": 99.82,
"r_x2": 173.33,
"r_y2": 94.86,
"r_x3": 153.74,
"r_y3": 94.86,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.51,
"t": 100.98,
"r": 173.32,
"b": 105.94,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.51,
"r_y0": 105.94,
"r_x1": 173.32,
"r_y1": 105.94,
"r_x2": 173.32,
"r_y2": 100.98,
"r_x3": 154.51,
"r_y3": 100.98,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.27,
"t": 107.1,
"r": 173.33,
"b": 112.06,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.27,
"r_y0": 112.06,
"r_x1": 173.33,
"r_y1": 112.06,
"r_x2": 173.33,
"r_y2": 107.1,
"r_x3": 155.27,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.41,
"t": 107.23,
"r": 346.0,
"b": 112.19,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.41,
"r_y0": 112.19,
"r_x1": 346.0,
"r_y1": 112.19,
"r_x2": 346.0,
"r_y2": 107.23,
"r_x3": 326.41,
"r_y3": 107.23,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.18,
"t": 113.35,
"r": 345.99,
"b": 118.31,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.18,
"r_y0": 118.31,
"r_x1": 345.99,
"r_y1": 118.31,
"r_x2": 345.99,
"r_y2": 113.35,
"r_x3": 327.18,
"r_y3": 113.35,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.94,
"t": 119.47,
"r": 346.0,
"b": 124.43,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.94,
"r_y0": 124.43,
"r_x1": 346.0,
"r_y1": 124.43,
"r_x2": 346.0,
"r_y2": 119.47,
"r_x3": 327.94,
"r_y3": 119.47,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 488.99,
"t": 104.15,
"r": 508.76,
"b": 109.11,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.99,
"r_y0": 109.11,
"r_x1": 508.76,
"r_y1": 109.11,
"r_x2": 508.76,
"r_y2": 104.15,
"r_x3": 488.99,
"r_y3": 104.15,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.19,
"t": 110.27,
"r": 508.76,
"b": 115.23,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.19,
"r_y0": 115.23,
"r_x1": 508.76,
"r_y1": 115.23,
"r_x2": 508.76,
"r_y2": 110.27,
"r_x3": 490.19,
"r_y3": 110.27,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.72,
"t": 116.39,
"r": 508.77,
"b": 121.35,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.72,
"r_y0": 121.35,
"r_x1": 508.77,
"r_y1": 121.35,
"r_x2": 508.77,
"r_y2": 116.39,
"r_x3": 489.72,
"r_y3": 116.39,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.71,
"t": 122.51,
"r": 508.77,
"b": 127.47,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.71,
"r_y0": 127.47,
"r_x1": 508.77,
"r_y1": 127.47,
"r_x2": 508.77,
"r_y2": 122.51,
"r_x3": 490.71,
"r_y3": 122.51,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.38,
"t": 141.71,
"r": 202.84,
"b": 146.67,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.38,
"r_y0": 146.67,
"r_x1": 202.84,
"r_y1": 146.67,
"r_x2": 202.84,
"r_y2": 141.71,
"r_x3": 185.38,
"r_y3": 141.71,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.14,
"r": 197.53,
"b": 91.09,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.09,
"r_x1": 197.53,
"r_y1": 91.09,
"r_x2": 197.53,
"r_y2": 86.14,
"r_x3": 168.5,
"r_y3": 86.14,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.38,
"t": 86.0,
"r": 367.4,
"b": 90.95,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.38,
"r_y0": 90.95,
"r_x1": 367.4,
"r_y1": 90.95,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.38,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.73,
"t": 141.62,
"r": 374.93,
"b": 146.58,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.73,
"r_y0": 146.58,
"r_x1": 374.93,
"r_y1": 146.58,
"r_x2": 374.93,
"r_y2": 141.62,
"r_x3": 333.73,
"r_y3": 141.62,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.69,
"t": 86.06,
"r": 355.71,
"b": 91.01,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.69,
"r_y0": 91.01,
"r_x1": 355.71,
"r_y1": 91.01,
"r_x2": 355.71,
"r_y2": 86.06,
"r_x3": 345.69,
"r_y3": 86.06,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.54,
"t": 141.38,
"r": 526.01,
"b": 146.33,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.54,
"r_y0": 146.33,
"r_x1": 526.01,
"r_y1": 146.33,
"r_x2": 526.01,
"r_y2": 141.38,
"r_x3": 508.54,
"r_y3": 141.38,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.45,
"t": 86.09,
"r": 523.71,
"b": 91.05,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.45,
"r_y0": 91.05,
"r_x1": 523.71,
"r_y1": 91.05,
"r_x2": 523.71,
"r_y2": 86.09,
"r_x3": 510.45,
"r_y3": 86.09,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 1,
"page_no": 11,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 165.5,
"r": 545.11,
"b": 186.36,
"coord_origin": "TOPLEFT"
},
"confidence": 0.966,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 174.41,
"r_x1": 545.11,
"r_y1": 174.41,
"r_x2": 545.11,
"r_y2": 165.5,
"r_x3": 50.11,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 186.36,
"r_x1": 513.52,
"r_y1": 186.36,
"r_x2": 513.52,
"r_y2": 177.46,
"r_x3": 50.11,
"r_y3": 177.46,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."
},
{
"label": "list_item",
"id": 4,
"page_no": 11,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 210.93,
"r": 286.37,
"b": 231.79,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 219.84,
"r_x1": 71.15,
"r_y1": 219.84,
"r_x2": 71.15,
"r_y2": 210.93,
"r_x3": 61.57,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.54,
"r_y0": 219.84,
"r_x1": 286.37,
"r_y1": 219.84,
"r_x2": 286.37,
"r_y2": 210.93,
"r_x3": 73.54,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 231.79,
"r_x1": 87.47,
"r_y1": 231.79,
"r_x2": 87.47,
"r_y2": 222.89,
"r_x3": 70.04,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 TableFormer output does not include the table cell content."
},
{
"label": "list_item",
"id": 3,
"page_no": 11,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.57,
"t": 244.07,
"r": 286.37,
"b": 264.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.963,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.57,
"r_y0": 252.98,
"r_x1": 71.35,
"r_y1": 252.98,
"r_x2": 71.35,
"r_y2": 244.07,
"r_x3": 61.57,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.79,
"r_y0": 252.98,
"r_x1": 286.37,
"r_y1": 252.98,
"r_x2": 286.37,
"r_y2": 244.07,
"r_x3": 73.79,
"r_y3": 244.07,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.04,
"r_y0": 264.93,
"r_x1": 150.42,
"r_y1": 264.93,
"r_x2": 150.42,
"r_y2": 256.03,
"r_x3": 70.04,
"r_y3": 256.03,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."
},
{
"label": "text",
"id": 0,
"page_no": 11,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.11,
"t": 279.2,
"r": 286.37,
"b": 395.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.977,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 288.11,
"r_x1": 286.36,
"r_y1": 288.11,
"r_x2": 286.36,
"r_y2": 279.2,
"r_x3": 62.07,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 300.06,
"r_x1": 286.37,
"r_y1": 300.06,
"r_x2": 286.37,
"r_y2": 291.16,
"r_x3": 50.11,
"r_y3": 291.16,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 312.02,
"r_x1": 286.37,
"r_y1": 312.02,
"r_x2": 286.37,
"r_y2": 303.11,
"r_x3": 50.11,
"r_y3": 303.11,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 323.97,
"r_x1": 286.37,
"r_y1": 323.97,
"r_x2": 286.37,
"r_y2": 315.07,
"r_x3": 50.11,
"r_y3": 315.07,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 335.93,
"r_x1": 286.37,
"r_y1": 335.93,
"r_x2": 286.37,
"r_y2": 327.02,
"r_x3": 50.11,
"r_y3": 327.02,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 347.89,
"r_x1": 286.37,
"r_y1": 347.89,
"r_x2": 286.37,
"r_y2": 338.98,
"r_x3": 50.11,
"r_y3": 338.98,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 359.84,
"r_x1": 286.37,
"r_y1": 359.84,
"r_x2": 286.37,
"r_y2": 350.93,
"r_x3": 50.11,
"r_y3": 350.93,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 371.8,
"r_x1": 286.37,
"r_y1": 371.8,
"r_x2": 286.37,
"r_y2": 362.89,
"r_x3": 50.11,
"r_y3": 362.89,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 383.75,
"r_x1": 286.37,
"r_y1": 383.75,
"r_x2": 286.37,
"r_y2": 374.84,
"r_x3": 50.11,
"r_y3": 374.84,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 395.71,
"r_x1": 154.56,
"r_y1": 395.71,
"r_x2": 154.56,
"r_y2": 386.8,
"r_x3": 50.11,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."
},
{
"label": "text",
"id": 11,
"page_no": 11,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.11,
"t": 399.07,
"r": 286.36,
"b": 419.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.935,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 407.98,
"r_x1": 286.36,
"r_y1": 407.98,
"r_x2": 286.36,
"r_y2": 399.07,
"r_x3": 62.07,
"r_y3": 399.07,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 419.93,
"r_x1": 95.49,
"r_y1": 419.93,
"r_x2": 95.49,
"r_y2": 411.03,
"r_x3": 50.11,
"r_y3": 411.03,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Here is a step-by-step description of the prediction postprocessing:"
},
{
"label": "list_item",
"id": 20,
"page_no": 11,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 423.3,
"r": 286.37,
"b": 456.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.828,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 432.2,
"r_x1": 69.37,
"r_y1": 432.2,
"r_x2": 69.37,
"r_y2": 423.3,
"r_x3": 62.07,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.81,
"r_y0": 432.2,
"r_x1": 286.37,
"r_y1": 432.2,
"r_x2": 286.37,
"r_y2": 423.3,
"r_x3": 71.81,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 444.16,
"r_x1": 286.37,
"r_y1": 444.16,
"r_x2": 286.37,
"r_y2": 435.25,
"r_x3": 50.11,
"r_y3": 435.25,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 456.11,
"r_x1": 274.51,
"r_y1": 456.11,
"r_x2": 274.51,
"r_y2": 447.21,
"r_x3": 50.11,
"r_y3": 447.21,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."
},
{
"label": "list_item",
"id": 2,
"page_no": 11,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 459.48,
"r": 286.37,
"b": 504.25,
"coord_origin": "TOPLEFT"
},
"confidence": 0.965,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 468.38,
"r_x1": 69.54,
"r_y1": 468.38,
"r_x2": 69.54,
"r_y2": 459.48,
"r_x3": 62.07,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.43,
"r_y0": 468.38,
"r_x1": 286.36,
"r_y1": 468.38,
"r_x2": 286.36,
"r_y2": 459.48,
"r_x3": 77.43,
"r_y3": 459.48,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 480.34,
"r_x1": 286.37,
"r_y1": 480.34,
"r_x2": 286.37,
"r_y2": 471.43,
"r_x3": 50.11,
"r_y3": 471.43,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 492.29,
"r_x1": 286.37,
"r_y1": 492.29,
"r_x2": 286.37,
"r_y2": 483.39,
"r_x3": 50.11,
"r_y3": 483.39,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 504.25,
"r_x1": 110.7,
"r_y1": 504.25,
"r_x2": 110.7,
"r_y2": 495.34,
"r_x3": 50.11,
"r_y3": 495.34,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."
},
{
"label": "list_item",
"id": 10,
"page_no": 11,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 507.61,
"r": 286.36,
"b": 528.47,
"coord_origin": "TOPLEFT"
},
"confidence": 0.939,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 516.52,
"r_x1": 69.86,
"r_y1": 516.52,
"r_x2": 69.86,
"r_y2": 507.61,
"r_x3": 62.07,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.46,
"r_y0": 516.52,
"r_x1": 286.36,
"r_y1": 516.52,
"r_x2": 286.36,
"r_y2": 507.61,
"r_x3": 72.46,
"r_y3": 507.61,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 528.47,
"r_x1": 226.07,
"r_y1": 528.47,
"r_x2": 226.07,
"r_y2": 519.57,
"r_x3": 50.11,
"r_y3": 519.57,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones."
},
{
"label": "list_item",
"id": 8,
"page_no": 11,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 531.84,
"r": 286.37,
"b": 564.65,
"coord_origin": "TOPLEFT"
},
"confidence": 0.949,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 540.74,
"r_x1": 286.36,
"r_y1": 540.74,
"r_x2": 286.36,
"r_y2": 531.84,
"r_x3": 62.07,
"r_y3": 531.84,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 552.7,
"r_x1": 286.37,
"r_y1": 552.7,
"r_x2": 286.37,
"r_y2": 543.79,
"r_x3": 50.11,
"r_y3": 543.79,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 564.65,
"r_x1": 114.03,
"r_y1": 564.65,
"r_x2": 114.03,
"r_y2": 555.75,
"r_x3": 50.11,
"r_y3": 555.75,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."
},
{
"label": "list_item",
"id": 5,
"page_no": 11,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 568.02,
"r": 286.37,
"b": 600.83,
"coord_origin": "TOPLEFT"
},
"confidence": 0.959,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 576.92,
"r_x1": 69.54,
"r_y1": 576.92,
"r_x2": 69.54,
"r_y2": 568.02,
"r_x3": 62.07,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.73,
"r_y0": 576.92,
"r_x1": 286.37,
"r_y1": 576.92,
"r_x2": 286.37,
"r_y2": 568.02,
"r_x3": 76.73,
"r_y3": 568.02,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 588.88,
"r_x1": 286.37,
"r_y1": 588.88,
"r_x2": 286.37,
"r_y2": 579.97,
"r_x3": 50.11,
"r_y3": 579.97,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 600.83,
"r_x1": 278.7,
"r_y1": 600.83,
"r_x2": 278.7,
"r_y2": 591.93,
"r_x3": 50.11,
"r_y3": 591.93,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"
},
{
"label": "formula",
"id": 12,
"page_no": 11,
"cluster": {
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.44,
"r": 286.36,
"b": 654.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.03,
"r_y0": 632.84,
"r_x1": 157.95,
"r_y1": 632.84,
"r_x2": 157.95,
"r_y2": 623.99,
"r_x3": 112.03,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.72,
"r_y0": 632.84,
"r_x1": 203.5,
"r_y1": 632.84,
"r_x2": 203.5,
"r_y2": 623.99,
"r_x3": 160.72,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.58,
"r_y0": 640.18,
"r_x1": 189.15,
"r_y1": 640.18,
"r_x2": 189.15,
"r_y2": 633.98,
"r_x3": 185.58,
"r_y3": 633.98,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.84,
"r_x1": 208.48,
"r_y1": 632.84,
"r_x2": 208.48,
"r_y2": 623.44,
"r_x3": 203.5,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.48,
"r_y0": 632.84,
"r_x1": 220.29,
"r_y1": 632.84,
"r_x2": 220.29,
"r_y2": 623.99,
"r_x3": 208.48,
"r_y3": 623.99,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 632.84,
"r_x1": 225.77,
"r_y1": 632.84,
"r_x2": 225.77,
"r_y2": 623.44,
"r_x3": 220.79,
"r_y3": 623.44,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.11,
"r_x1": 122.51,
"r_y1": 654.11,
"r_x2": 122.51,
"r_y2": 645.26,
"r_x3": 110.7,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.78,
"r_y0": 654.11,
"r_x1": 133.53,
"r_y1": 654.11,
"r_x2": 133.53,
"r_y2": 645.26,
"r_x3": 125.78,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.29,
"r_y0": 654.11,
"r_x1": 156.0,
"r_y1": 654.11,
"r_x2": 156.0,
"r_y2": 645.26,
"r_x3": 136.29,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.11,
"r_x1": 160.98,
"r_y1": 654.11,
"r_x2": 160.98,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.98,
"r_y0": 654.11,
"r_x1": 170.24,
"r_y1": 654.11,
"r_x2": 170.24,
"r_y2": 645.26,
"r_x3": 160.98,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.74,
"r_y0": 654.11,
"r_x1": 185.68,
"r_y1": 654.11,
"r_x2": 185.68,
"r_y2": 644.7,
"r_x3": 170.74,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.89,
"r_y0": 654.11,
"r_x1": 206.05,
"r_y1": 654.11,
"r_x2": 206.05,
"r_y2": 645.26,
"r_x3": 187.89,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.05,
"r_y0": 654.11,
"r_x1": 211.04,
"r_y1": 654.11,
"r_x2": 211.04,
"r_y2": 644.7,
"r_x3": 206.05,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.03,
"r_y0": 654.11,
"r_x1": 220.29,
"r_y1": 654.11,
"r_x2": 220.29,
"r_y2": 645.26,
"r_x3": 211.03,
"r_y3": 645.26,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.79,
"r_y0": 654.11,
"r_x1": 225.77,
"r_y1": 654.11,
"r_x2": 225.77,
"r_y2": 644.7,
"r_x3": 220.79,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.75,
"r_y0": 643.79,
"r_x1": 286.36,
"r_y1": 643.79,
"r_x2": 286.36,
"r_y2": 634.89,
"r_x3": 274.75,
"r_y3": 634.89,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)"
},
{
"label": "text",
"id": 7,
"page_no": 11,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.11,
"t": 667.35,
"r": 286.36,
"b": 688.93,
"coord_origin": "TOPLEFT"
},
"confidence": 0.955,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 676.97,
"r_x1": 74.45,
"r_y1": 676.97,
"r_x2": 74.45,
"r_y2": 668.07,
"r_x3": 50.11,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.34,
"r_y0": 676.75,
"r_x1": 82.65,
"r_y1": 676.75,
"r_x2": 82.65,
"r_y2": 667.91,
"r_x3": 78.34,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.53,
"r_y0": 676.97,
"r_x1": 123.63,
"r_y1": 676.97,
"r_x2": 123.63,
"r_y2": 668.07,
"r_x3": 86.53,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.52,
"r_y0": 676.75,
"r_x1": 132.5,
"r_y1": 676.75,
"r_x2": 132.5,
"r_y2": 667.35,
"r_x3": 127.52,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 676.97,
"r_x1": 210.7,
"r_y1": 676.97,
"r_x2": 210.7,
"r_y2": 668.07,
"r_x3": 132.5,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.75,
"r_x1": 215.68,
"r_y1": 676.75,
"r_x2": 215.68,
"r_y2": 667.35,
"r_x3": 210.7,
"r_y3": 667.35,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.56,
"r_y0": 676.97,
"r_x1": 233.95,
"r_y1": 676.97,
"r_x2": 233.95,
"r_y2": 668.07,
"r_x3": 219.56,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.83,
"r_y0": 676.75,
"r_x1": 247.09,
"r_y1": 676.75,
"r_x2": 247.09,
"r_y2": 667.91,
"r_x3": 237.83,
"r_y3": 667.91,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.47,
"r_y0": 676.97,
"r_x1": 286.36,
"r_y1": 676.97,
"r_x2": 286.36,
"r_y2": 668.07,
"r_x3": 251.47,
"r_y3": 668.07,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 688.93,
"r_x1": 205.89,
"r_y1": 688.93,
"r_x2": 205.89,
"r_y2": 680.02,
"r_x3": 50.11,
"r_y3": 680.02,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point."
},
{
"label": "list_item",
"id": 13,
"page_no": 11,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.11,
"t": 692.29,
"r": 286.36,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 701.2,
"r_x1": 69.54,
"r_y1": 701.2,
"r_x2": 69.54,
"r_y2": 692.29,
"r_x3": 62.07,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.27,
"r_y0": 701.2,
"r_x1": 286.36,
"r_y1": 701.2,
"r_x2": 286.36,
"r_y2": 692.29,
"r_x3": 76.27,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 713.15,
"r_x1": 94.6,
"r_y1": 713.15,
"r_x2": 94.6,
"r_y2": 704.25,
"r_x3": 50.11,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.93,
"r_x1": 103.29,
"r_y1": 712.93,
"r_x2": 103.29,
"r_y2": 704.09,
"r_x3": 97.6,
"r_y3": 704.09,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.29,
"r_y0": 713.15,
"r_x1": 286.36,
"r_y1": 713.15,
"r_x2": 286.36,
"r_y2": 704.25,
"r_x3": 103.29,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-"
},
{
"label": "text",
"id": 16,
"page_no": 11,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 308.86,
"t": 210.93,
"r": 545.12,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.894,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 219.84,
"r_x1": 545.12,
"r_y1": 219.84,
"r_x2": 545.12,
"r_y2": 210.93,
"r_x3": 308.86,
"r_y3": 210.93,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 231.79,
"r_x1": 545.12,
"r_y1": 231.79,
"r_x2": 545.12,
"r_y2": 222.89,
"r_x3": 308.86,
"r_y3": 222.89,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 243.75,
"r_x1": 545.12,
"r_y1": 243.75,
"r_x2": 545.12,
"r_y2": 234.84,
"r_x3": 308.86,
"r_y3": 234.84,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 255.7,
"r_x1": 339.58,
"r_y1": 255.7,
"r_x2": 339.58,
"r_y2": 246.8,
"r_x3": 308.86,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."
},
{
"label": "list_item",
"id": 9,
"page_no": 11,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 259.1,
"r": 545.11,
"b": 279.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.942,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 268.01,
"r_x1": 328.29,
"r_y1": 268.01,
"r_x2": 328.29,
"r_y2": 259.1,
"r_x3": 320.82,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.88,
"r_y0": 268.01,
"r_x1": 545.11,
"r_y1": 268.01,
"r_x2": 545.11,
"r_y2": 259.1,
"r_x3": 334.88,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 279.96,
"r_x1": 338.19,
"r_y1": 279.96,
"r_x2": 338.19,
"r_y2": 271.06,
"r_x3": 308.86,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.68,
"r_y0": 279.74,
"r_x1": 346.38,
"r_y1": 279.74,
"r_x2": 346.38,
"r_y2": 270.9,
"r_x3": 340.68,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.38,
"r_y0": 279.96,
"r_x1": 453.72,
"r_y1": 279.96,
"r_x2": 453.72,
"r_y2": 271.06,
"r_x3": 346.38,
"r_y3": 271.06,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes."
},
{
"label": "list_item",
"id": 6,
"page_no": 11,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 283.36,
"r": 545.12,
"b": 387.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.956,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 292.27,
"r_x1": 328.39,
"r_y1": 292.27,
"r_x2": 328.39,
"r_y2": 283.36,
"r_x3": 320.82,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.91,
"r_y0": 292.27,
"r_x1": 545.11,
"r_y1": 292.27,
"r_x2": 545.11,
"r_y2": 283.36,
"r_x3": 330.91,
"r_y3": 283.36,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 304.22,
"r_x1": 545.12,
"r_y1": 304.22,
"r_x2": 545.12,
"r_y2": 295.32,
"r_x3": 308.86,
"r_y3": 295.32,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 316.18,
"r_x1": 545.12,
"r_y1": 316.18,
"r_x2": 545.12,
"r_y2": 307.27,
"r_x3": 308.86,
"r_y3": 307.27,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 328.13,
"r_x1": 545.12,
"r_y1": 328.13,
"r_x2": 545.12,
"r_y2": 319.23,
"r_x3": 308.86,
"r_y3": 319.23,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 340.09,
"r_x1": 397.19,
"r_y1": 340.09,
"r_x2": 397.19,
"r_y2": 331.18,
"r_x3": 308.86,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.66,
"r_y0": 340.09,
"r_x1": 545.12,
"r_y1": 340.09,
"r_x2": 545.12,
"r_y2": 331.18,
"r_x3": 403.66,
"r_y3": 331.18,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 352.05,
"r_x1": 545.12,
"r_y1": 352.05,
"r_x2": 545.12,
"r_y2": 343.14,
"r_x3": 308.86,
"r_y3": 343.14,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 364.0,
"r_x1": 545.12,
"r_y1": 364.0,
"r_x2": 545.12,
"r_y2": 355.09,
"r_x3": 308.86,
"r_y3": 355.09,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 375.96,
"r_x1": 545.12,
"r_y1": 375.96,
"r_x2": 545.12,
"r_y2": 367.05,
"r_x3": 308.86,
"r_y3": 367.05,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 387.91,
"r_x1": 329.61,
"r_y1": 387.91,
"r_x2": 329.61,
"r_y2": 379.0,
"r_x3": 308.86,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."
},
{
"label": "list_item",
"id": 17,
"page_no": 11,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 391.31,
"r": 545.12,
"b": 459.99,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 400.22,
"r_x1": 328.55,
"r_y1": 400.22,
"r_x2": 328.55,
"r_y2": 391.31,
"r_x3": 320.82,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.13,
"r_y0": 400.22,
"r_x1": 545.12,
"r_y1": 400.22,
"r_x2": 545.12,
"r_y2": 391.31,
"r_x3": 331.13,
"r_y3": 391.31,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 412.17,
"r_x1": 545.12,
"r_y1": 412.17,
"r_x2": 545.12,
"r_y2": 403.27,
"r_x3": 308.86,
"r_y3": 403.27,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 424.13,
"r_x1": 545.12,
"r_y1": 424.13,
"r_x2": 545.12,
"r_y2": 415.22,
"r_x3": 308.86,
"r_y3": 415.22,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 436.08,
"r_x1": 545.12,
"r_y1": 436.08,
"r_x2": 545.12,
"r_y2": 427.18,
"r_x3": 308.86,
"r_y3": 427.18,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 448.04,
"r_x1": 545.12,
"r_y1": 448.04,
"r_x2": 545.12,
"r_y2": 439.13,
"r_x3": 308.86,
"r_y3": 439.13,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 459.99,
"r_x1": 426.18,
"r_y1": 459.99,
"r_x2": 426.18,
"r_y2": 451.09,
"r_x3": 308.86,
"r_y3": 451.09,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."
},
{
"label": "list_item",
"id": 15,
"page_no": 11,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 463.39,
"r": 545.12,
"b": 567.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 472.3,
"r_x1": 328.67,
"r_y1": 472.3,
"r_x2": 328.67,
"r_y2": 463.39,
"r_x3": 320.82,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.29,
"r_y0": 472.3,
"r_x1": 545.11,
"r_y1": 472.3,
"r_x2": 545.11,
"r_y2": 463.39,
"r_x3": 331.29,
"r_y3": 463.39,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 484.25,
"r_x1": 545.12,
"r_y1": 484.25,
"r_x2": 545.12,
"r_y2": 475.35,
"r_x3": 308.86,
"r_y3": 475.35,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 496.21,
"r_x1": 545.12,
"r_y1": 496.21,
"r_x2": 545.12,
"r_y2": 487.3,
"r_x3": 308.86,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 508.16,
"r_x1": 381.9,
"r_y1": 508.16,
"r_x2": 381.9,
"r_y2": 499.26,
"r_x3": 308.86,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.16,
"r_x1": 545.12,
"r_y1": 508.16,
"r_x2": 545.12,
"r_y2": 499.26,
"r_x3": 388.7,
"r_y3": 499.26,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 520.12,
"r_x1": 545.12,
"r_y1": 520.12,
"r_x2": 545.12,
"r_y2": 511.21,
"r_x3": 308.86,
"r_y3": 511.21,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 532.07,
"r_x1": 545.12,
"r_y1": 532.07,
"r_x2": 545.12,
"r_y2": 523.17,
"r_x3": 308.86,
"r_y3": 523.17,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 544.03,
"r_x1": 545.11,
"r_y1": 544.03,
"r_x2": 545.11,
"r_y2": 535.12,
"r_x3": 308.86,
"r_y3": 535.12,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 555.98,
"r_x1": 545.12,
"r_y1": 555.98,
"r_x2": 545.12,
"r_y2": 547.08,
"r_x3": 308.86,
"r_y3": 547.08,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 567.94,
"r_x1": 442.22,
"r_y1": 567.94,
"r_x2": 442.22,
"r_y2": 559.03,
"r_x3": 308.86,
"r_y3": 559.03,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."
},
{
"label": "text",
"id": 19,
"page_no": 11,
"cluster": {
"id": 19,
"label": "text",
"bbox": {
"l": 308.86,
"t": 571.34,
"r": 545.12,
"b": 604.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.846,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 580.24,
"r_x1": 545.11,
"r_y1": 580.24,
"r_x2": 545.11,
"r_y2": 571.34,
"r_x3": 320.82,
"r_y3": 571.34,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 592.2,
"r_x1": 471.64,
"r_y1": 592.2,
"r_x2": 471.64,
"r_y2": 583.29,
"r_x3": 308.86,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.83,
"r_y0": 591.98,
"r_x1": 479.72,
"r_y1": 591.98,
"r_x2": 479.72,
"r_y2": 583.13,
"r_x3": 474.83,
"r_y3": 583.13,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.27,
"r_y0": 592.2,
"r_x1": 545.12,
"r_y1": 592.2,
"r_x2": 545.12,
"r_y2": 583.29,
"r_x3": 483.27,
"r_y3": 583.29,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 604.15,
"r_x1": 329.91,
"r_y1": 604.15,
"r_x2": 329.91,
"r_y2": 595.25,
"r_x3": 308.86,
"r_y3": 595.25,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."
},
{
"label": "list_item",
"id": 21,
"page_no": 11,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 607.55,
"r": 545.12,
"b": 628.42,
"coord_origin": "TOPLEFT"
},
"confidence": 0.772,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 616.46,
"r_x1": 332.87,
"r_y1": 616.46,
"r_x2": 332.87,
"r_y2": 607.55,
"r_x3": 320.82,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.93,
"r_y0": 616.46,
"r_x1": 545.12,
"r_y1": 616.46,
"r_x2": 545.12,
"r_y2": 607.55,
"r_x3": 339.93,
"r_y3": 607.55,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 628.42,
"r_x1": 495.29,
"r_y1": 628.42,
"r_x2": 495.29,
"r_y2": 619.51,
"r_x3": 308.86,
"r_y3": 619.51,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."
},
{
"label": "list_item",
"id": 18,
"page_no": 11,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 631.81,
"r": 545.12,
"b": 664.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.858,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 640.72,
"r_x1": 545.12,
"r_y1": 640.72,
"r_x2": 545.12,
"r_y2": 631.81,
"r_x3": 320.82,
"r_y3": 631.81,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 652.68,
"r_x1": 455.28,
"r_y1": 652.68,
"r_x2": 455.28,
"r_y2": 643.77,
"r_x3": 308.86,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.78,
"r_y0": 652.46,
"r_x1": 463.47,
"r_y1": 652.46,
"r_x2": 463.47,
"r_y2": 643.61,
"r_x3": 457.78,
"r_y3": 643.61,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.97,
"r_y0": 652.68,
"r_x1": 545.11,
"r_y1": 652.68,
"r_x2": 545.11,
"r_y2": 643.77,
"r_x3": 465.97,
"r_y3": 643.77,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 664.63,
"r_x1": 332.38,
"r_y1": 664.63,
"r_x2": 332.38,
"r_y2": 655.72,
"r_x3": 308.86,
"r_y3": 655.72,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."
},
{
"label": "list_item",
"id": 22,
"page_no": 11,
"cluster": {
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 668.03,
"r": 545.11,
"b": 688.89,
"coord_origin": "TOPLEFT"
},
"confidence": 0.759,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 676.94,
"r_x1": 545.11,
"r_y1": 676.94,
"r_x2": 545.11,
"r_y2": 668.03,
"r_x3": 320.82,
"r_y3": 668.03,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 688.89,
"r_x1": 510.58,
"r_y1": 688.89,
"r_x2": 510.58,
"r_y2": 679.99,
"r_x3": 308.86,
"r_y3": 679.99,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."
},
{
"label": "list_item",
"id": 25,
"page_no": 11,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.86,
"t": 692.29,
"r": 545.12,
"b": 713.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.697,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.82,
"r_y0": 701.2,
"r_x1": 545.12,
"r_y1": 701.2,
"r_x2": 545.12,
"r_y2": 692.29,
"r_x3": 320.82,
"r_y3": 692.29,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 713.15,
"r_x1": 545.12,
"r_y1": 713.15,
"r_x2": 545.12,
"r_y2": 704.25,
"r_x3": 308.86,
"r_y3": 704.25,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 11,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "12"
}
]
}
},
{
"page_no": 12,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 88.85,
"r_y1": 84.11,
"r_x2": 88.85,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.07,
"r_x1": 286.36,
"r_y1": 96.07,
"r_x2": 286.36,
"r_y2": 87.16,
"r_x3": 62.07,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 127.03,
"r_y1": 108.02,
"r_x2": 127.03,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 119.75,
"r_x1": 286.36,
"r_y1": 119.75,
"r_x2": 286.36,
"r_y2": 111.16,
"r_x3": 62.07,
"r_y3": 111.16,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.71,
"r_x1": 234.06,
"r_y1": 131.71,
"r_x2": 234.06,
"r_y2": 123.12,
"r_x3": 50.11,
"r_y3": 123.12,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.34,
"r_y0": 510.96,
"r_x1": 273.13,
"r_y1": 510.96,
"r_x2": 273.13,
"r_y2": 502.06,
"r_x3": 63.34,
"r_y3": 502.06,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 315.5,
"r_x1": 345.63,
"r_y1": 315.5,
"r_x2": 345.63,
"r_y2": 306.6,
"r_x3": 308.86,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.79,
"r_y0": 315.5,
"r_x1": 545.12,
"r_y1": 315.5,
"r_x2": 545.12,
"r_y2": 306.6,
"r_x3": 352.79,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 327.46,
"r_x1": 355.9,
"r_y1": 327.46,
"r_x2": 355.9,
"r_y2": 318.55,
"r_x3": 308.86,
"r_y3": 318.55,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.34,
"r_y0": 689.4,
"r_x1": 541.63,
"r_y1": 689.4,
"r_x2": 541.63,
"r_y2": 680.49,
"r_x3": 312.34,
"r_y3": 680.49,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 88.85,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.755,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 88.85,
"r_y1": 84.11,
"r_x2": 88.85,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.16,
"r": 286.36,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.917,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.07,
"r_x1": 286.36,
"r_y1": 96.07,
"r_x2": 286.36,
"r_y2": 87.16,
"r_x3": 62.07,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 127.03,
"r_y1": 108.02,
"r_x2": 127.03,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 111.16,
"r": 286.36,
"b": 131.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 119.75,
"r_x1": 286.36,
"r_y1": 119.75,
"r_x2": 286.36,
"r_y2": 111.16,
"r_x3": 62.07,
"r_y3": 111.16,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.71,
"r_x1": 234.06,
"r_y1": 131.71,
"r_x2": 234.06,
"r_y2": 123.12,
"r_x3": 50.11,
"r_y3": 123.12,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "caption",
"bbox": {
"l": 63.34,
"t": 502.06,
"r": 273.13,
"b": 510.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.897,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.34,
"r_y0": 510.96,
"r_x1": 273.13,
"r_y1": 510.96,
"r_x2": 273.13,
"r_y2": 502.06,
"r_x3": 63.34,
"r_y3": 502.06,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 306.6,
"r": 545.12,
"b": 327.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 315.5,
"r_x1": 345.63,
"r_y1": 315.5,
"r_x2": 345.63,
"r_y2": 306.6,
"r_x3": 308.86,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.79,
"r_y0": 315.5,
"r_x1": 545.12,
"r_y1": 315.5,
"r_x2": 545.12,
"r_y2": 306.6,
"r_x3": 352.79,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 327.46,
"r_x1": 355.9,
"r_y1": 327.46,
"r_x2": 355.9,
"r_y2": 318.55,
"r_x3": 308.86,
"r_y3": 318.55,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "caption",
"bbox": {
"l": 312.34,
"t": 680.49,
"r": 541.63,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.34,
"r_y0": 689.4,
"r_x1": 541.63,
"r_y1": 689.4,
"r_x2": 541.63,
"r_y2": 680.49,
"r_x3": 312.34,
"r_y3": 680.49,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.902,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "table",
"bbox": {
"l": 310.33,
"t": 101.18,
"r": 555.83,
"b": 136.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.705,
"cells": [],
"children": []
},
{
"id": 32,
"label": "table",
"bbox": {
"l": 309.96,
"t": 154.61,
"r": 555.75,
"b": 184.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.564,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 84.03,
"t": 156.33,
"r": 239.17,
"b": 214.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.886,
"cells": [],
"children": []
},
{
"id": 21,
"label": "table",
"bbox": {
"l": 309.96,
"t": 195.71,
"r": 555.71,
"b": 233.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 82.92,
"t": 233.78,
"r": 239.19,
"b": 291.28,
"coord_origin": "TOPLEFT"
},
"confidence": 0.916,
"cells": [],
"children": []
},
{
"id": 19,
"label": "picture",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.696,
"cells": [],
"children": []
},
{
"id": 37,
"label": "table",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.528,
"cells": [],
"children": []
},
{
"id": 6,
"label": "table",
"bbox": {
"l": 83.95,
"t": 309.05,
"r": 239.17,
"b": 367.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.909,
"cells": [],
"children": []
},
{
"id": 12,
"label": "table",
"bbox": {
"l": 335.27,
"t": 388.47,
"r": 490.08,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [],
"children": []
},
{
"id": 0,
"label": "table",
"bbox": {
"l": 83.32,
"t": 396.01,
"r": 248.87,
"b": 487.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 334.93,
"t": 453.95,
"r": 490.09,
"b": 502.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [],
"children": []
},
{
"id": 5,
"label": "table",
"bbox": {
"l": 335.25,
"t": 519.08,
"r": 490.22,
"b": 567.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
{
"id": 13,
"label": "picture",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.802,
"cells": [],
"children": []
},
{
"id": 30,
"label": "table",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.593,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"17": {
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.33,
"t": 101.18,
"r": 555.83,
"b": 136.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.705,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"32": {
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 309.96,
"t": 154.61,
"r": 555.75,
"b": 184.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.564,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.03,
"t": 156.33,
"r": 239.17,
"b": 214.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.886,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"21": {
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 309.96,
"t": 195.71,
"r": 555.71,
"b": 233.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"4": {
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.92,
"t": 233.78,
"r": 239.19,
"b": 291.28,
"coord_origin": "TOPLEFT"
},
"confidence": 0.916,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"37": {
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.528,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"6": {
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.95,
"t": 309.05,
"r": 239.17,
"b": 367.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.909,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"12": {
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.27,
"t": 388.47,
"r": 490.08,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"0": {
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.32,
"t": 396.01,
"r": 248.87,
"b": 487.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.93,
"t": 453.95,
"r": 490.09,
"b": 502.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"5": {
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.25,
"t": 519.08,
"r": 490.22,
"b": 567.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"30": {
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.593,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 14,
"page_no": 12,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 88.85,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.755,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 88.85,
"r_y1": 84.11,
"r_x2": 88.85,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "phan cell."
},
{
"label": "text",
"id": 3,
"page_no": 12,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.16,
"r": 286.36,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.917,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.07,
"r_x1": 286.36,
"r_y1": 96.07,
"r_x2": 286.36,
"r_y2": 87.16,
"r_x3": 62.07,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 127.03,
"r_y1": 108.02,
"r_x2": 127.03,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."
},
{
"label": "text",
"id": 1,
"page_no": 12,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 111.16,
"r": 286.36,
"b": 131.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 119.75,
"r_x1": 286.36,
"r_y1": 119.75,
"r_x2": 286.36,
"r_y2": 111.16,
"r_x3": 62.07,
"r_y3": 111.16,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.71,
"r_x1": 234.06,
"r_y1": 131.71,
"r_x2": 234.06,
"r_y2": 123.12,
"r_x3": 50.11,
"r_y3": 123.12,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."
},
{
"label": "caption",
"id": 8,
"page_no": 12,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 63.34,
"t": 502.06,
"r": 273.13,
"b": 510.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.897,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.34,
"r_y0": 510.96,
"r_x1": 273.13,
"r_y1": 510.96,
"r_x2": 273.13,
"r_y2": 502.06,
"r_x3": 63.34,
"r_y3": 502.06,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 8: Example of a table with multi-line header."
},
{
"label": "caption",
"id": 11,
"page_no": 12,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 306.6,
"r": 545.12,
"b": 327.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 315.5,
"r_x1": 345.63,
"r_y1": 315.5,
"r_x2": 345.63,
"r_y2": 306.6,
"r_x3": 308.86,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.79,
"r_y0": 315.5,
"r_x1": 545.12,
"r_y1": 315.5,
"r_x2": 545.12,
"r_y2": 306.6,
"r_x3": 352.79,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 327.46,
"r_x1": 355.9,
"r_y1": 327.46,
"r_x2": 355.9,
"r_y2": 318.55,
"r_x3": 308.86,
"r_y3": 318.55,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 9: Example of a table with big empty distance between cells."
},
{
"label": "caption",
"id": 2,
"page_no": 12,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 312.34,
"t": 680.49,
"r": 541.63,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.34,
"r_y0": 689.4,
"r_x1": 541.63,
"r_y1": 689.4,
"r_x2": 541.63,
"r_y2": 680.49,
"r_x3": 312.34,
"r_y3": 680.49,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 10: Example of a complex table with empty cells."
},
{
"label": "page_footer",
"id": 7,
"page_no": 12,
"cluster": {
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.902,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "13"
},
{
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.33,
"t": 101.18,
"r": 555.83,
"b": 136.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.705,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 309.96,
"t": 154.61,
"r": 555.75,
"b": 184.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.564,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.03,
"t": 156.33,
"r": 239.17,
"b": 214.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.886,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 309.96,
"t": 195.71,
"r": 555.71,
"b": 233.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.92,
"t": 233.78,
"r": 239.19,
"b": 291.28,
"coord_origin": "TOPLEFT"
},
"confidence": 0.916,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 19,
"page_no": 12,
"cluster": {
"id": 19,
"label": "picture",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.696,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.528,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.95,
"t": 309.05,
"r": 239.17,
"b": 367.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.909,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.27,
"t": 388.47,
"r": 490.08,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.32,
"t": 396.01,
"r": 248.87,
"b": 487.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.93,
"t": 453.95,
"r": 490.09,
"b": 502.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.25,
"t": 519.08,
"r": 490.22,
"b": 567.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 13,
"page_no": 12,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.802,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.593,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"body": [
{
"label": "text",
"id": 14,
"page_no": 12,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.11,
"t": 75.21,
"r": 88.85,
"b": 84.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.755,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 84.11,
"r_x1": 88.85,
"r_y1": 84.11,
"r_x2": 88.85,
"r_y2": 75.21,
"r_x3": 50.11,
"r_y3": 75.21,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "phan cell."
},
{
"label": "text",
"id": 3,
"page_no": 12,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.11,
"t": 87.16,
"r": 286.36,
"b": 108.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.917,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 96.07,
"r_x1": 286.36,
"r_y1": 96.07,
"r_x2": 286.36,
"r_y2": 87.16,
"r_x3": 62.07,
"r_y3": 87.16,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 108.02,
"r_x1": 127.03,
"r_y1": 108.02,
"r_x2": 127.03,
"r_y2": 99.12,
"r_x3": 50.11,
"r_y3": 99.12,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."
},
{
"label": "text",
"id": 1,
"page_no": 12,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.11,
"t": 111.16,
"r": 286.36,
"b": 131.71,
"coord_origin": "TOPLEFT"
},
"confidence": 0.945,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.07,
"r_y0": 119.75,
"r_x1": 286.36,
"r_y1": 119.75,
"r_x2": 286.36,
"r_y2": 111.16,
"r_x3": 62.07,
"r_y3": 111.16,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 131.71,
"r_x1": 234.06,
"r_y1": 131.71,
"r_x2": 234.06,
"r_y2": 123.12,
"r_x3": 50.11,
"r_y3": 123.12,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."
},
{
"label": "caption",
"id": 8,
"page_no": 12,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 63.34,
"t": 502.06,
"r": 273.13,
"b": 510.96,
"coord_origin": "TOPLEFT"
},
"confidence": 0.897,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.34,
"r_y0": 510.96,
"r_x1": 273.13,
"r_y1": 510.96,
"r_x2": 273.13,
"r_y2": 502.06,
"r_x3": 63.34,
"r_y3": 502.06,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 8: Example of a table with multi-line header."
},
{
"label": "caption",
"id": 11,
"page_no": 12,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 306.6,
"r": 545.12,
"b": 327.46,
"coord_origin": "TOPLEFT"
},
"confidence": 0.877,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 315.5,
"r_x1": 345.63,
"r_y1": 315.5,
"r_x2": 345.63,
"r_y2": 306.6,
"r_x3": 308.86,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.79,
"r_y0": 315.5,
"r_x1": 545.12,
"r_y1": 315.5,
"r_x2": 545.12,
"r_y2": 306.6,
"r_x3": 352.79,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 327.46,
"r_x1": 355.9,
"r_y1": 327.46,
"r_x2": 355.9,
"r_y2": 318.55,
"r_x3": 308.86,
"r_y3": 318.55,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 9: Example of a table with big empty distance between cells."
},
{
"label": "caption",
"id": 2,
"page_no": 12,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 312.34,
"t": 680.49,
"r": 541.63,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.34,
"r_y0": 689.4,
"r_x1": 541.63,
"r_y1": 689.4,
"r_x2": 541.63,
"r_y2": 680.49,
"r_x3": 312.34,
"r_y3": 680.49,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 10: Example of a complex table with empty cells."
},
{
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.33,
"t": 101.18,
"r": 555.83,
"b": 136.15,
"coord_origin": "TOPLEFT"
},
"confidence": 0.705,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 309.96,
"t": 154.61,
"r": 555.75,
"b": 184.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.564,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.03,
"t": 156.33,
"r": 239.17,
"b": 214.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.886,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 309.96,
"t": 195.71,
"r": 555.71,
"b": 233.55,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.92,
"t": 233.78,
"r": 239.19,
"b": 291.28,
"coord_origin": "TOPLEFT"
},
"confidence": 0.916,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 19,
"page_no": 12,
"cluster": {
"id": 19,
"label": "picture",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.696,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.79,
"t": 253.91,
"r": 425.96,
"b": 292.39,
"coord_origin": "TOPLEFT"
},
"confidence": 0.528,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.95,
"t": 309.05,
"r": 239.17,
"b": 367.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.909,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.27,
"t": 388.47,
"r": 490.08,
"b": 437.02,
"coord_origin": "TOPLEFT"
},
"confidence": 0.849,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.32,
"t": 396.01,
"r": 248.87,
"b": 487.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.961,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.93,
"t": 453.95,
"r": 490.09,
"b": 502.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.882,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.25,
"t": 519.08,
"r": 490.22,
"b": 567.69,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 13,
"page_no": 12,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.802,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 333.96,
"t": 593.11,
"r": 518.48,
"b": 665.49,
"coord_origin": "TOPLEFT"
},
"confidence": 0.593,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"headers": [
{
"label": "page_footer",
"id": 7,
"page_no": 12,
"cluster": {
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.902,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "13"
}
]
}
},
{
"page_no": 13,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.68,
"r_x1": 93.05,
"r_y1": 365.68,
"r_x2": 93.05,
"r_y2": 356.77,
"r_x3": 50.11,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.73,
"r_y0": 365.68,
"r_x1": 286.37,
"r_y1": 365.68,
"r_x2": 286.37,
"r_y2": 356.77,
"r_x3": 103.73,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 377.63,
"r_x1": 70.86,
"r_y1": 377.63,
"r_x2": 70.86,
"r_y2": 368.73,
"r_x3": 50.11,
"r_y3": 368.73,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.62,
"r_y0": 680.72,
"r_x1": 281.86,
"r_y1": 680.72,
"r_x2": 281.86,
"r_y2": 671.82,
"r_x3": 54.62,
"r_y3": 671.82,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.79,
"r_y0": 380.59,
"r_x1": 538.19,
"r_y1": 380.59,
"r_x2": 538.19,
"r_y2": 371.68,
"r_x3": 315.79,
"r_y3": 371.68,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 344.98,
"r_y0": 692.45,
"r_x1": 508.99,
"r_y1": 692.45,
"r_x2": 508.99,
"r_y2": 683.55,
"r_x3": 344.98,
"r_y3": 683.55,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 356.77,
"r": 286.37,
"b": 377.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.951,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.68,
"r_x1": 93.05,
"r_y1": 365.68,
"r_x2": 93.05,
"r_y2": 356.77,
"r_x3": 50.11,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.73,
"r_y0": 365.68,
"r_x1": 286.37,
"r_y1": 365.68,
"r_x2": 286.37,
"r_y2": 356.77,
"r_x3": 103.73,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 377.63,
"r_x1": 70.86,
"r_y1": 377.63,
"r_x2": 70.86,
"r_y2": 368.73,
"r_x3": 50.11,
"r_y3": 368.73,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 54.62,
"t": 671.82,
"r": 281.86,
"b": 680.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.62,
"r_y0": 680.72,
"r_x1": 281.86,
"r_y1": 680.72,
"r_x2": 281.86,
"r_y2": 671.82,
"r_x3": 54.62,
"r_y3": 671.82,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "caption",
"bbox": {
"l": 315.79,
"t": 371.68,
"r": 538.19,
"b": 380.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.918,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.79,
"r_y0": 380.59,
"r_x1": 538.19,
"r_y1": 380.59,
"r_x2": 538.19,
"r_y2": 371.68,
"r_x3": 315.79,
"r_y3": 371.68,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "caption",
"bbox": {
"l": 344.98,
"t": 683.55,
"r": 508.99,
"b": 692.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 344.98,
"r_y0": 692.45,
"r_x1": 508.99,
"r_y1": 692.45,
"r_x2": 508.99,
"r_y2": 683.55,
"r_x3": 344.98,
"r_y3": 683.55,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "picture",
"bbox": {
"l": 318.63,
"t": 90.88,
"r": 534.74,
"b": 359.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
{
"id": 30,
"label": "picture",
"bbox": {
"l": 51.15,
"t": 104.31,
"r": 282.86,
"b": 344.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.561,
"cells": [],
"children": []
},
{
"id": 23,
"label": "table",
"bbox": {
"l": 318.98,
"t": 161.23,
"r": 534.62,
"b": 214.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.624,
"cells": [],
"children": []
},
{
"id": 33,
"label": "table",
"bbox": {
"l": 319.01,
"t": 226.11,
"r": 534.41,
"b": 279.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
{
"id": 27,
"label": "table",
"bbox": {
"l": 51.73,
"t": 273.61,
"r": 283.11,
"b": 344.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
{
"id": 38,
"label": "table",
"bbox": {
"l": 328.14,
"t": 288.68,
"r": 523.89,
"b": 358.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.523,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 319.47,
"t": 430.9,
"r": 518.57,
"b": 477.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 51.43,
"t": 453.49,
"r": 310.73,
"b": 491.82,
"coord_origin": "TOPLEFT"
},
"confidence": 0.842,
"cells": [],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 319.98,
"t": 489.24,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 50.87,
"t": 504.1,
"r": 310.61,
"b": 542.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.892,
"cells": [],
"children": []
},
{
"id": 15,
"label": "table",
"bbox": {
"l": 319.83,
"t": 546.41,
"r": 519.61,
"b": 593.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.682,
"cells": [],
"children": []
},
{
"id": 6,
"label": "table",
"bbox": {
"l": 51.27,
"t": 553.73,
"r": 311.09,
"b": 591.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [],
"children": []
},
{
"id": 7,
"label": "table",
"bbox": {
"l": 319.06,
"t": 609.84,
"r": 533.77,
"b": 669.19,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [],
"children": []
},
{
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.06,
"b": 656.16,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"23": {
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 318.98,
"t": 161.23,
"r": 534.62,
"b": 214.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.624,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"33": {
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.01,
"t": 226.11,
"r": 534.41,
"b": 279.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"27": {
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.73,
"t": 273.61,
"r": 283.11,
"b": 344.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"38": {
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.14,
"t": 288.68,
"r": 523.89,
"b": 358.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.523,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.47,
"t": 430.9,
"r": 518.57,
"b": 477.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.43,
"t": 453.49,
"r": 310.73,
"b": 491.82,
"coord_origin": "TOPLEFT"
},
"confidence": 0.842,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"8": {
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 319.98,
"t": 489.24,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"4": {
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.87,
"t": 504.1,
"r": 310.61,
"b": 542.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.892,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"15": {
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.83,
"t": 546.41,
"r": 519.61,
"b": 593.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.682,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"6": {
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.27,
"t": 553.73,
"r": 311.09,
"b": 591.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"7": {
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.06,
"t": 609.84,
"r": 533.77,
"b": 669.19,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 13,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 356.77,
"r": 286.37,
"b": 377.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.951,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.68,
"r_x1": 93.05,
"r_y1": 365.68,
"r_x2": 93.05,
"r_y2": 356.77,
"r_x3": 50.11,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.73,
"r_y0": 365.68,
"r_x1": 286.37,
"r_y1": 365.68,
"r_x2": 286.37,
"r_y2": 356.77,
"r_x3": 103.73,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 377.63,
"r_x1": 70.86,
"r_y1": 377.63,
"r_x2": 70.86,
"r_y2": 368.73,
"r_x3": 50.11,
"r_y3": 368.73,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 11: Simple table with different style and empty cells."
},
{
"label": "caption",
"id": 1,
"page_no": 13,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 54.62,
"t": 671.82,
"r": 281.86,
"b": 680.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.62,
"r_y0": 680.72,
"r_x1": 281.86,
"r_y1": 680.72,
"r_x2": 281.86,
"r_y2": 671.82,
"r_x3": 54.62,
"r_y3": 671.82,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 12: Simple table predictions and post processing."
},
{
"label": "caption",
"id": 3,
"page_no": 13,
"cluster": {
"id": 3,
"label": "caption",
"bbox": {
"l": 315.79,
"t": 371.68,
"r": 538.19,
"b": 380.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.918,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.79,
"r_y0": 380.59,
"r_x1": 538.19,
"r_y1": 380.59,
"r_x2": 538.19,
"r_y2": 371.68,
"r_x3": 315.79,
"r_y3": 371.68,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 13: Table predictions example on colorful table."
},
{
"label": "caption",
"id": 2,
"page_no": 13,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 344.98,
"t": 683.55,
"r": 508.99,
"b": 692.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 344.98,
"r_y0": 692.45,
"r_x1": 508.99,
"r_y1": 692.45,
"r_x2": 508.99,
"r_y2": 683.55,
"r_x3": 344.98,
"r_y3": 683.55,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 14: Example with multi-line text."
},
{
"label": "page_footer",
"id": 5,
"page_no": 13,
"cluster": {
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "14"
},
{
"label": "picture",
"id": 41,
"page_no": 13,
"cluster": {
"id": 41,
"label": "picture",
"bbox": {
"l": 318.63,
"t": 90.88,
"r": 534.74,
"b": 359.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 30,
"page_no": 13,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 51.15,
"t": 104.31,
"r": 282.86,
"b": 344.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.561,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 318.98,
"t": 161.23,
"r": 534.62,
"b": 214.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.624,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.01,
"t": 226.11,
"r": 534.41,
"b": 279.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.73,
"t": 273.61,
"r": 283.11,
"b": 344.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.14,
"t": 288.68,
"r": 523.89,
"b": 358.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.523,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.47,
"t": 430.9,
"r": 518.57,
"b": 477.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.43,
"t": 453.49,
"r": 310.73,
"b": 491.82,
"coord_origin": "TOPLEFT"
},
"confidence": 0.842,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 319.98,
"t": 489.24,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.87,
"t": 504.1,
"r": 310.61,
"b": 542.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.892,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.83,
"t": 546.41,
"r": 519.61,
"b": 593.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.682,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.27,
"t": 553.73,
"r": 311.09,
"b": 591.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.06,
"t": 609.84,
"r": 533.77,
"b": 669.19,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 11,
"page_no": 13,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.06,
"b": 656.16,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 13,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 356.77,
"r": 286.37,
"b": 377.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.951,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 365.68,
"r_x1": 93.05,
"r_y1": 365.68,
"r_x2": 93.05,
"r_y2": 356.77,
"r_x3": 50.11,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.73,
"r_y0": 365.68,
"r_x1": 286.37,
"r_y1": 365.68,
"r_x2": 286.37,
"r_y2": 356.77,
"r_x3": 103.73,
"r_y3": 356.77,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 377.63,
"r_x1": 70.86,
"r_y1": 377.63,
"r_x2": 70.86,
"r_y2": 368.73,
"r_x3": 50.11,
"r_y3": 368.73,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 11: Simple table with different style and empty cells."
},
{
"label": "caption",
"id": 1,
"page_no": 13,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 54.62,
"t": 671.82,
"r": 281.86,
"b": 680.72,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.62,
"r_y0": 680.72,
"r_x1": 281.86,
"r_y1": 680.72,
"r_x2": 281.86,
"r_y2": 671.82,
"r_x3": 54.62,
"r_y3": 671.82,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 12: Simple table predictions and post processing."
},
{
"label": "caption",
"id": 3,
"page_no": 13,
"cluster": {
"id": 3,
"label": "caption",
"bbox": {
"l": 315.79,
"t": 371.68,
"r": 538.19,
"b": 380.59,
"coord_origin": "TOPLEFT"
},
"confidence": 0.918,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.79,
"r_y0": 380.59,
"r_x1": 538.19,
"r_y1": 380.59,
"r_x2": 538.19,
"r_y2": 371.68,
"r_x3": 315.79,
"r_y3": 371.68,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 13: Table predictions example on colorful table."
},
{
"label": "caption",
"id": 2,
"page_no": 13,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 344.98,
"t": 683.55,
"r": 508.99,
"b": 692.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.919,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 344.98,
"r_y0": 692.45,
"r_x1": 508.99,
"r_y1": 692.45,
"r_x2": 508.99,
"r_y2": 683.55,
"r_x3": 344.98,
"r_y3": 683.55,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 14: Example with multi-line text."
},
{
"label": "picture",
"id": 41,
"page_no": 13,
"cluster": {
"id": 41,
"label": "picture",
"bbox": {
"l": 318.63,
"t": 90.88,
"r": 534.74,
"b": 359.06,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 30,
"page_no": 13,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 51.15,
"t": 104.31,
"r": 282.86,
"b": 344.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.561,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 318.98,
"t": 161.23,
"r": 534.62,
"b": 214.63,
"coord_origin": "TOPLEFT"
},
"confidence": 0.624,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.01,
"t": 226.11,
"r": 534.41,
"b": 279.86,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.73,
"t": 273.61,
"r": 283.11,
"b": 344.24,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.14,
"t": 288.68,
"r": 523.89,
"b": 358.27,
"coord_origin": "TOPLEFT"
},
"confidence": 0.523,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.47,
"t": 430.9,
"r": 518.57,
"b": 477.94,
"coord_origin": "TOPLEFT"
},
"confidence": 0.838,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.43,
"t": 453.49,
"r": 310.73,
"b": 491.82,
"coord_origin": "TOPLEFT"
},
"confidence": 0.842,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 319.98,
"t": 489.24,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.87,
"t": 504.1,
"r": 310.61,
"b": 542.45,
"coord_origin": "TOPLEFT"
},
"confidence": 0.892,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.83,
"t": 546.41,
"r": 519.61,
"b": 593.11,
"coord_origin": "TOPLEFT"
},
"confidence": 0.682,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.27,
"t": 553.73,
"r": 311.09,
"b": 591.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.887,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.06,
"t": 609.84,
"r": 533.77,
"b": 669.19,
"coord_origin": "TOPLEFT"
},
"confidence": 0.872,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 11,
"page_no": 13,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.06,
"b": 656.16,
"coord_origin": "TOPLEFT"
},
"confidence": 0.787,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 5,
"page_no": 13,
"cluster": {
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.888,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "14"
}
]
}
},
{
"page_no": 14,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.23,
"r_y0": 653.26,
"r_x1": 252.24,
"r_y1": 653.26,
"r_x2": 252.24,
"r_y2": 644.35,
"r_x3": 84.23,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 661.84,
"r_x1": 545.12,
"r_y1": 661.84,
"r_x2": 545.12,
"r_y2": 652.94,
"r_x3": 308.86,
"r_y3": 652.94,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.89,
"r_x3": 308.86,
"r_y3": 664.89,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 84.23,
"t": 644.35,
"r": 252.24,
"b": 653.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.23,
"r_y0": 653.26,
"r_x1": 252.24,
"r_y1": 653.26,
"r_x2": 252.24,
"r_y2": 644.35,
"r_x3": 84.23,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 652.94,
"r": 545.12,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 661.84,
"r_x1": 545.12,
"r_y1": 661.84,
"r_x2": 545.12,
"r_y2": 652.94,
"r_x3": 308.86,
"r_y3": 652.94,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.89,
"r_x3": 308.86,
"r_y3": 664.89,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 323.01,
"t": 121.55,
"r": 525.95,
"b": 222.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [],
"children": []
},
{
"id": 6,
"label": "picture",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
{
"id": 19,
"label": "table",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.558,
"cells": [],
"children": []
},
{
"id": 2,
"label": "table",
"bbox": {
"l": 323.38,
"t": 241.97,
"r": 526.13,
"b": 344.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.906,
"cells": [],
"children": []
},
{
"id": 18,
"label": "picture",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.567,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.775,
"cells": [],
"children": []
},
{
"id": 20,
"label": "picture",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.552,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.776,
"cells": [],
"children": []
},
{
"id": 5,
"label": "picture",
"bbox": {
"l": 55.42,
"t": 384.56,
"r": 280.23,
"b": 497.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [],
"children": []
},
{
"id": 22,
"label": "picture",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.548,
"cells": [],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.781,
"cells": [],
"children": []
},
{
"id": 7,
"label": "picture",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [],
"children": []
},
{
"id": 11,
"label": "table",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.684,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"4": {
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.01,
"t": 121.55,
"r": 525.95,
"b": 222.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"19": {
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.558,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"2": {
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.38,
"t": 241.97,
"r": 526.13,
"b": 344.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.906,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.775,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.776,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"8": {
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.781,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"11": {
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.684,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 14,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 84.23,
"t": 644.35,
"r": 252.24,
"b": 653.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.23,
"r_y0": 653.26,
"r_x1": 252.24,
"r_y1": 653.26,
"r_x2": 252.24,
"r_y2": 644.35,
"r_x3": 84.23,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 15: Example with triangular table."
},
{
"label": "caption",
"id": 1,
"page_no": 14,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 652.94,
"r": 545.12,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 661.84,
"r_x1": 545.12,
"r_y1": 661.84,
"r_x2": 545.12,
"r_y2": 652.94,
"r_x3": 308.86,
"r_y3": 652.94,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.89,
"r_x3": 308.86,
"r_y3": 664.89,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."
},
{
"label": "page_footer",
"id": 3,
"page_no": 14,
"cluster": {
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "15"
},
{
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.01,
"t": 121.55,
"r": 525.95,
"b": 222.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 6,
"page_no": 14,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.558,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.38,
"t": 241.97,
"r": 526.13,
"b": 344.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.906,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 18,
"page_no": 14,
"cluster": {
"id": 18,
"label": "picture",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.567,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.775,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 20,
"page_no": 14,
"cluster": {
"id": 20,
"label": "picture",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.552,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.776,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 5,
"page_no": 14,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 55.42,
"t": 384.56,
"r": 280.23,
"b": 497.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 22,
"page_no": 14,
"cluster": {
"id": 22,
"label": "picture",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.548,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.781,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 7,
"page_no": 14,
"cluster": {
"id": 7,
"label": "picture",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.684,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 14,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 84.23,
"t": 644.35,
"r": 252.24,
"b": 653.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.926,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.23,
"r_y0": 653.26,
"r_x1": 252.24,
"r_y1": 653.26,
"r_x2": 252.24,
"r_y2": 644.35,
"r_x3": 84.23,
"r_y3": 644.35,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 15: Example with triangular table."
},
{
"label": "caption",
"id": 1,
"page_no": 14,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 308.86,
"t": 652.94,
"r": 545.12,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 661.84,
"r_x1": 545.12,
"r_y1": 661.84,
"r_x2": 545.12,
"r_y2": 652.94,
"r_x3": 308.86,
"r_y3": 652.94,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.86,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.89,
"r_x3": 308.86,
"r_y3": 664.89,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."
},
{
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.01,
"t": 121.55,
"r": 525.95,
"b": 222.91,
"coord_origin": "TOPLEFT"
},
"confidence": 0.857,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 6,
"page_no": 14,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.12,
"t": 136.26,
"r": 279.37,
"b": 249.33,
"coord_origin": "TOPLEFT"
},
"confidence": 0.558,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.38,
"t": 241.97,
"r": 526.13,
"b": 344.09,
"coord_origin": "TOPLEFT"
},
"confidence": 0.906,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 18,
"page_no": 14,
"cluster": {
"id": 18,
"label": "picture",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.567,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.28,
"t": 260.26,
"r": 279.26,
"b": 373.53,
"coord_origin": "TOPLEFT"
},
"confidence": 0.775,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 20,
"page_no": 14,
"cluster": {
"id": 20,
"label": "picture",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.552,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.47,
"t": 362.45,
"r": 525.96,
"b": 464.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.776,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 5,
"page_no": 14,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 55.42,
"t": 384.56,
"r": 280.23,
"b": 497.56,
"coord_origin": "TOPLEFT"
},
"confidence": 0.841,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 22,
"page_no": 14,
"cluster": {
"id": 22,
"label": "picture",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.548,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.69,
"t": 487.41,
"r": 495.43,
"b": 635.77,
"coord_origin": "TOPLEFT"
},
"confidence": 0.781,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 7,
"page_no": 14,
"cluster": {
"id": 7,
"label": "picture",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.806,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.65,
"t": 505.98,
"r": 319.91,
"b": 631.26,
"coord_origin": "TOPLEFT"
},
"confidence": 0.684,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"headers": [
{
"label": "page_footer",
"id": 3,
"page_no": 14,
"cluster": {
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.904,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "15"
}
]
}
},
{
"page_no": 15,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 517.24,
"r_x1": 545.11,
"r_y1": 517.24,
"r_x2": 545.11,
"r_y2": 508.34,
"r_x3": 50.11,
"r_y3": 508.34,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 529.2,
"r_x1": 173.24,
"r_y1": 529.2,
"r_x2": 173.24,
"r_y2": 520.29,
"r_x3": 50.11,
"r_y3": 520.29,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 508.34,
"r": 545.11,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 517.24,
"r_x1": 545.11,
"r_y1": 517.24,
"r_x2": 545.11,
"r_y2": 508.34,
"r_x3": 50.11,
"r_y3": 508.34,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 529.2,
"r_x1": 173.24,
"r_y1": 529.2,
"r_x2": 173.24,
"r_y2": 520.29,
"r_x3": 50.11,
"r_y3": 520.29,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.62,
"r": 528.56,
"b": 498.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.691,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 15,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 508.34,
"r": 545.11,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 517.24,
"r_x1": 545.11,
"r_y1": 517.24,
"r_x2": 545.11,
"r_y2": 508.34,
"r_x3": 50.11,
"r_y3": 508.34,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 529.2,
"r_x1": 173.24,
"r_y1": 529.2,
"r_x2": 173.24,
"r_y2": 520.29,
"r_x3": 50.11,
"r_y3": 520.29,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."
},
{
"label": "page_footer",
"id": 1,
"page_no": 15,
"cluster": {
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "16"
},
{
"label": "picture",
"id": 2,
"page_no": 15,
"cluster": {
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.62,
"r": 528.56,
"b": 498.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.691,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 15,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.11,
"t": 508.34,
"r": 545.11,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.962,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 517.24,
"r_x1": 545.11,
"r_y1": 517.24,
"r_x2": 545.11,
"r_y2": 508.34,
"r_x3": 50.11,
"r_y3": 508.34,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.11,
"r_y0": 529.2,
"r_x1": 173.24,
"r_y1": 529.2,
"r_x2": 173.24,
"r_y2": 520.29,
"r_x3": 50.11,
"r_y3": 520.29,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."
},
{
"label": "picture",
"id": 2,
"page_no": 15,
"cluster": {
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.62,
"r": 528.56,
"b": 498.14,
"coord_origin": "TOPLEFT"
},
"confidence": 0.691,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 1,
"page_no": 15,
"cluster": {
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.63,
"t": 734.13,
"r": 302.59,
"b": 743.04,
"coord_origin": "TOPLEFT"
},
"confidence": 0.913,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.63,
"r_y0": 743.04,
"r_x1": 302.59,
"r_y1": 743.04,
"r_x2": 302.59,
"r_y2": 734.13,
"r_x3": 292.63,
"r_y3": 734.13,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "16"
}
]
}
}
] |